blob: 6e8bfab4c3544b491e4565f0e9cfd81d295f2009 [file] [log] [blame]
Tim Shen158e51b2018-04-23 21:54:06 +00001// -*- C++ -*-
Louis Dionne9bd93882021-11-17 16:25:01 -05002//===----------------------------------------------------------------------===//
Tim Shen158e51b2018-04-23 21:54:06 +00003//
Chandler Carruthd2012102019-01-19 10:56:40 +00004// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
5// See https://llvm.org/LICENSE.txt for license information.
6// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Tim Shen158e51b2018-04-23 21:54:06 +00007//
8//===----------------------------------------------------------------------===//
9#ifndef _LIBCPP_EXPERIMENTAL_SIMD
10#define _LIBCPP_EXPERIMENTAL_SIMD
11
12/*
13 experimental/simd synopsis
14
15namespace std::experimental {
16
17inline namespace parallelism_v2 {
18
19namespace simd_abi {
20
21struct scalar {};
22template <int N> struct fixed_size {};
23template <typename T> inline constexpr int max_fixed_size = implementation-defined;
24template <typename T> using compatible = implementation-defined;
25template <typename T> using native = implementation-defined;
26
27} // simd_abi
28
29struct element_aligned_tag {};
30struct vector_aligned_tag {};
31template <size_t> struct overaligned_tag {};
32inline constexpr element_aligned_tag element_aligned{};
33inline constexpr vector_aligned_tag vector_aligned{};
34template <size_t N> inline constexpr overaligned_tag<N> overaligned{};
35
36// traits [simd.traits]
37template <class T> struct is_abi_tag;
38template <class T> inline constexpr bool is_abi_tag_v = is_abi_tag<T>::value;
39
40template <class T> struct is_simd;
41template <class T> inline constexpr bool is_simd_v = is_simd<T>::value;
42
43template <class T> struct is_simd_mask;
44template <class T> inline constexpr bool is_simd_mask_v = is_simd_mask<T>::value;
45
46template <class T> struct is_simd_flag_type;
47template <class T> inline constexpr bool is_simd_flag_type_v = is_simd_flag_type<T>::value;
48
49template <class T, size_t N> struct abi_for_size { using type = see below; };
50template <class T, size_t N> using abi_for_size_t = typename abi_for_size<T, N>::type;
51
52template <class T, class Abi = simd_abi::compatible<T>> struct simd_size;
53template <class T, class Abi = simd_abi::compatible<T>>
54inline constexpr size_t simd_size_v = simd_size<T, Abi>::value;
55
56template <class T, class U = typename T::value_type> struct memory_alignment;
57template <class T, class U = typename T::value_type>
58inline constexpr size_t memory_alignment_v = memory_alignment<T, U>::value;
59
60// class template simd [simd.class]
61template <class T, class Abi = simd_abi::compatible<T>> class simd;
62template <class T> using native_simd = simd<T, simd_abi::native<T>>;
63template <class T, int N> using fixed_size_simd = simd<T, simd_abi::fixed_size<N>>;
64
65// class template simd_mask [simd.mask.class]
66template <class T, class Abi = simd_abi::compatible<T>> class simd_mask;
67template <class T> using native_simd_mask = simd_mask<T, simd_abi::native<T>>;
68template <class T, int N> using fixed_size_simd_mask = simd_mask<T, simd_abi::fixed_size<N>>;
69
70// casts [simd.casts]
71template <class T, class U, class Abi> see below simd_cast(const simd<U, Abi>&);
72template <class T, class U, class Abi> see below static_simd_cast(const simd<U, Abi>&);
73
74template <class T, class Abi>
75fixed_size_simd<T, simd_size_v<T, Abi>> to_fixed_size(const simd<T, Abi>&) noexcept;
76template <class T, class Abi>
77fixed_size_simd_mask<T, simd_size_v<T, Abi>> to_fixed_size(const simd_mask<T, Abi>&) noexcept;
78template <class T, size_t N> native_simd<T> to_native(const fixed_size_simd<T, N>&) noexcept;
79template <class T, size_t N>
80native_simd_mask<T> to_native(const fixed_size_simd_mask<T, N>&) noexcept;
81template <class T, size_t N> simd<T> to_compatible(const fixed_size_simd<T, N>&) noexcept;
82template <class T, size_t N> simd_mask<T> to_compatible(const fixed_size_simd_mask<T, N>&) noexcept;
83
84template <size_t... Sizes, class T, class Abi>
85tuple<simd<T, abi_for_size_t<T, Sizes>>...> split(const simd<T, Abi>&);
86template <size_t... Sizes, class T, class Abi>
87tuple<simd_mask<T, abi_for_size_t<T, Sizes>>...> split(const simd_mask<T, Abi>&);
88template <class V, class Abi>
89array<V, simd_size_v<typename V::value_type, Abi> / V::size()> split(
90const simd<typename V::value_type, Abi>&);
91template <class V, class Abi>
92array<V, simd_size_v<typename V::value_type, Abi> / V::size()> split(
93const simd_mask<typename V::value_type, Abi>&);
94
95template <class T, class... Abis>
96simd<T, abi_for_size_t<T, (simd_size_v<T, Abis> + ...)>> concat(const simd<T, Abis>&...);
97template <class T, class... Abis>
98simd_mask<T, abi_for_size_t<T, (simd_size_v<T, Abis> + ...)>> concat(const simd_mask<T, Abis>&...);
99
100// reductions [simd.mask.reductions]
101template <class T, class Abi> bool all_of(const simd_mask<T, Abi>&) noexcept;
102template <class T, class Abi> bool any_of(const simd_mask<T, Abi>&) noexcept;
103template <class T, class Abi> bool none_of(const simd_mask<T, Abi>&) noexcept;
104template <class T, class Abi> bool some_of(const simd_mask<T, Abi>&) noexcept;
105template <class T, class Abi> int popcount(const simd_mask<T, Abi>&) noexcept;
106template <class T, class Abi> int find_first_set(const simd_mask<T, Abi>&);
107template <class T, class Abi> int find_last_set(const simd_mask<T, Abi>&);
108
109bool all_of(see below) noexcept;
110bool any_of(see below) noexcept;
111bool none_of(see below) noexcept;
112bool some_of(see below) noexcept;
113int popcount(see below) noexcept;
114int find_first_set(see below) noexcept;
115int find_last_set(see below) noexcept;
116
117// masked assignment [simd.whereexpr]
118template <class M, class T> class const_where_expression;
119template <class M, class T> class where_expression;
120
121// masked assignment [simd.mask.where]
122template <class T> struct nodeduce { using type = T; }; // exposition only
123
124template <class T> using nodeduce_t = typename nodeduce<T>::type; // exposition only
125
126template <class T, class Abi>
127where_expression<simd_mask<T, Abi>, simd<T, Abi>>
128where(const typename simd<T, Abi>::mask_type&, simd<T, Abi>&) noexcept;
129
130template <class T, class Abi>
131const_where_expression<simd_mask<T, Abi>, const simd<T, Abi>>
132where(const typename simd<T, Abi>::mask_type&, const simd<T, Abi>&) noexcept;
133
134template <class T, class Abi>
135where_expression<simd_mask<T, Abi>, simd_mask<T, Abi>>
136where(const nodeduce_t<simd_mask<T, Abi>>&, simd_mask<T, Abi>&) noexcept;
137
138template <class T, class Abi>
139const_where_expression<simd_mask<T, Abi>, const simd_mask<T, Abi>>
140where(const nodeduce_t<simd_mask<T, Abi>>&, const simd_mask<T, Abi>&) noexcept;
141
142template <class T> where_expression<bool, T> where(see below k, T& d) noexcept;
143
144template <class T>
145const_where_expression<bool, const T> where(see below k, const T& d) noexcept;
146
147// reductions [simd.reductions]
148template <class T, class Abi, class BinaryOperation = std::plus<>>
149T reduce(const simd<T, Abi>&, BinaryOperation = BinaryOperation());
150
151template <class M, class V, class BinaryOperation>
152typename V::value_type reduce(const const_where_expression<M, V>& x,
153typename V::value_type neutral_element, BinaryOperation binary_op);
154
155template <class M, class V>
156typename V::value_type reduce(const const_where_expression<M, V>& x, plus<> binary_op = plus<>());
157
158template <class M, class V>
159typename V::value_type reduce(const const_where_expression<M, V>& x, multiplies<> binary_op);
160
161template <class M, class V>
162typename V::value_type reduce(const const_where_expression<M, V>& x, bit_and<> binary_op);
163
164template <class M, class V>
165typename V::value_type reduce(const const_where_expression<M, V>& x, bit_or<> binary_op);
166
167template <class M, class V>
168typename V::value_type reduce(const const_where_expression<M, V>& x, bit_xor<> binary_op);
169
170template <class T, class Abi> T hmin(const simd<T, Abi>&);
171template <class M, class V> typename V::value_type hmin(const const_where_expression<M, V>&);
172template <class T, class Abi> T hmax(const simd<T, Abi>&);
173template <class M, class V> typename V::value_type hmax(const const_where_expression<M, V>&);
174
175// algorithms [simd.alg]
176template <class T, class Abi> simd<T, Abi> min(const simd<T, Abi>&, const simd<T, Abi>&) noexcept;
177
178template <class T, class Abi> simd<T, Abi> max(const simd<T, Abi>&, const simd<T, Abi>&) noexcept;
179
180template <class T, class Abi>
181std::pair<simd<T, Abi>, simd<T, Abi>> minmax(const simd<T, Abi>&, const simd<T, Abi>&) noexcept;
182
183template <class T, class Abi>
184simd<T, Abi> clamp(const simd<T, Abi>& v, const simd<T, Abi>& lo, const simd<T, Abi>& hi);
185
186// [simd.whereexpr]
187template <class M, class T>
188class const_where_expression {
189 const M& mask; // exposition only
190 T& data; // exposition only
191public:
192 const_where_expression(const const_where_expression&) = delete;
193 const_where_expression& operator=(const const_where_expression&) = delete;
194 remove_const_t<T> operator-() const &&;
195 template <class U, class Flags> void copy_to(U* mem, Flags f) const &&;
196};
197
198template <class M, class T>
199class where_expression : public const_where_expression<M, T> {
200public:
201 where_expression(const where_expression&) = delete;
202 where_expression& operator=(const where_expression&) = delete;
203 template <class U> void operator=(U&& x);
204 template <class U> void operator+=(U&& x);
205 template <class U> void operator-=(U&& x);
206 template <class U> void operator*=(U&& x);
207 template <class U> void operator/=(U&& x);
208 template <class U> void operator%=(U&& x);
209 template <class U> void operator&=(U&& x);
210 template <class U> void operator|=(U&& x);
211 template <class U> void operator^=(U&& x);
212 template <class U> void operator<<=(U&& x);
213 template <class U> void operator>>=(U&& x);
214 void operator++();
215 void operator++(int);
216 void operator--();
217 void operator--(int);
218 template <class U, class Flags> void copy_from(const U* mem, Flags);
219};
220
221// [simd.class]
222template <class T, class Abi> class simd {
223public:
224 using value_type = T;
225 using reference = see below;
226 using mask_type = simd_mask<T, Abi>;
227
228 using abi_type = Abi;
229 static constexpr size_t size() noexcept;
230 simd() = default;
231
232 // implicit type conversion constructor
233 template <class U> simd(const simd<U, simd_abi::fixed_size<size()>>&);
234
235 // implicit broadcast constructor (see below for constraints)
236 template <class U> simd(U&& value);
237
238 // generator constructor (see below for constraints)
239 template <class G> explicit simd(G&& gen);
240
241 // load constructor
242 template <class U, class Flags> simd(const U* mem, Flags f);
243
244 // loads [simd.load]
245 template <class U, class Flags> void copy_from(const U* mem, Flags f);
246
247 // stores [simd.store]
248 template <class U, class Flags> void copy_to(U* mem, Flags f) const;
249
250 // scalar access [simd.subscr]
251 reference operator[](size_t);
252 value_type operator[](size_t) const;
253
254 // unary operators [simd.unary]
255 simd& operator++();
256 simd operator++(int);
257 simd& operator--();
258 simd operator--(int);
259 mask_type operator!() const;
260 simd operator~() const; // see below
261 simd operator+() const;
262 simd operator-() const;
263
264 // binary operators [simd.binary]
265 friend simd operator+ (const simd&, const simd&);
266 friend simd operator- (const simd&, const simd&);
267 friend simd operator* (const simd&, const simd&);
268 friend simd operator/ (const simd&, const simd&);
269 friend simd operator% (const simd&, const simd&);
270 friend simd operator& (const simd&, const simd&);
271 friend simd operator| (const simd&, const simd&);
272 friend simd operator^ (const simd&, const simd&);
273 friend simd operator<<(const simd&, const simd&);
274 friend simd operator>>(const simd&, const simd&);
275 friend simd operator<<(const simd&, int);
276 friend simd operator>>(const simd&, int);
277
278 // compound assignment [simd.cassign]
279 friend simd& operator+= (simd&, const simd&);
280 friend simd& operator-= (simd&, const simd&);
281 friend simd& operator*= (simd&, const simd&);
282 friend simd& operator/= (simd&, const simd&);
283 friend simd& operator%= (simd&, const simd&);
284
285 friend simd& operator&= (simd&, const simd&);
286 friend simd& operator|= (simd&, const simd&);
287 friend simd& operator^= (simd&, const simd&);
288 friend simd& operator<<=(simd&, const simd&);
289 friend simd& operator>>=(simd&, const simd&);
290 friend simd& operator<<=(simd&, int);
291 friend simd& operator>>=(simd&, int);
292
293 // compares [simd.comparison]
294 friend mask_type operator==(const simd&, const simd&);
295 friend mask_type operator!=(const simd&, const simd&);
296 friend mask_type operator>=(const simd&, const simd&);
297 friend mask_type operator<=(const simd&, const simd&);
298 friend mask_type operator> (const simd&, const simd&);
299 friend mask_type operator< (const simd&, const simd&);
300};
301
302// [simd.math]
303template <class Abi> using scharv = simd<signed char, Abi>; // exposition only
304template <class Abi> using shortv = simd<short, Abi>; // exposition only
305template <class Abi> using intv = simd<int, Abi>; // exposition only
306template <class Abi> using longv = simd<long int, Abi>; // exposition only
307template <class Abi> using llongv = simd<long long int, Abi>; // exposition only
308template <class Abi> using floatv = simd<float, Abi>; // exposition only
309template <class Abi> using doublev = simd<double, Abi>; // exposition only
310template <class Abi> using ldoublev = simd<long double, Abi>; // exposition only
311template <class T, class V> using samesize = fixed_size_simd<T, V::size()>; // exposition only
312
313template <class Abi> floatv<Abi> acos(floatv<Abi> x);
314template <class Abi> doublev<Abi> acos(doublev<Abi> x);
315template <class Abi> ldoublev<Abi> acos(ldoublev<Abi> x);
316
317template <class Abi> floatv<Abi> asin(floatv<Abi> x);
318template <class Abi> doublev<Abi> asin(doublev<Abi> x);
319template <class Abi> ldoublev<Abi> asin(ldoublev<Abi> x);
320
321template <class Abi> floatv<Abi> atan(floatv<Abi> x);
322template <class Abi> doublev<Abi> atan(doublev<Abi> x);
323template <class Abi> ldoublev<Abi> atan(ldoublev<Abi> x);
324
325template <class Abi> floatv<Abi> atan2(floatv<Abi> y, floatv<Abi> x);
326template <class Abi> doublev<Abi> atan2(doublev<Abi> y, doublev<Abi> x);
327template <class Abi> ldoublev<Abi> atan2(ldoublev<Abi> y, ldoublev<Abi> x);
328
329template <class Abi> floatv<Abi> cos(floatv<Abi> x);
330template <class Abi> doublev<Abi> cos(doublev<Abi> x);
331template <class Abi> ldoublev<Abi> cos(ldoublev<Abi> x);
332
333template <class Abi> floatv<Abi> sin(floatv<Abi> x);
334template <class Abi> doublev<Abi> sin(doublev<Abi> x);
335template <class Abi> ldoublev<Abi> sin(ldoublev<Abi> x);
336
337template <class Abi> floatv<Abi> tan(floatv<Abi> x);
338template <class Abi> doublev<Abi> tan(doublev<Abi> x);
339template <class Abi> ldoublev<Abi> tan(ldoublev<Abi> x);
340
341template <class Abi> floatv<Abi> acosh(floatv<Abi> x);
342template <class Abi> doublev<Abi> acosh(doublev<Abi> x);
343template <class Abi> ldoublev<Abi> acosh(ldoublev<Abi> x);
344
345template <class Abi> floatv<Abi> asinh(floatv<Abi> x);
346template <class Abi> doublev<Abi> asinh(doublev<Abi> x);
347template <class Abi> ldoublev<Abi> asinh(ldoublev<Abi> x);
348
349template <class Abi> floatv<Abi> atanh(floatv<Abi> x);
350template <class Abi> doublev<Abi> atanh(doublev<Abi> x);
351template <class Abi> ldoublev<Abi> atanh(ldoublev<Abi> x);
352
353template <class Abi> floatv<Abi> cosh(floatv<Abi> x);
354template <class Abi> doublev<Abi> cosh(doublev<Abi> x);
355template <class Abi> ldoublev<Abi> cosh(ldoublev<Abi> x);
356
357template <class Abi> floatv<Abi> sinh(floatv<Abi> x);
358template <class Abi> doublev<Abi> sinh(doublev<Abi> x);
359template <class Abi> ldoublev<Abi> sinh(ldoublev<Abi> x);
360
361template <class Abi> floatv<Abi> tanh(floatv<Abi> x);
362template <class Abi> doublev<Abi> tanh(doublev<Abi> x);
363template <class Abi> ldoublev<Abi> tanh(ldoublev<Abi> x);
364
365template <class Abi> floatv<Abi> exp(floatv<Abi> x);
366template <class Abi> doublev<Abi> exp(doublev<Abi> x);
367template <class Abi> ldoublev<Abi> exp(ldoublev<Abi> x);
368
369template <class Abi> floatv<Abi> exp2(floatv<Abi> x);
370template <class Abi> doublev<Abi> exp2(doublev<Abi> x);
371template <class Abi> ldoublev<Abi> exp2(ldoublev<Abi> x);
372
373template <class Abi> floatv<Abi> expm1(floatv<Abi> x);
374template <class Abi> doublev<Abi> expm1(doublev<Abi> x);
375template <class Abi> ldoublev<Abi> expm1(ldoublev<Abi> x);
376
377template <class Abi> floatv<Abi> frexp(floatv<Abi> value, samesize<int, floatv<Abi>>* exp);
378template <class Abi> doublev<Abi> frexp(doublev<Abi> value, samesize<int, doublev<Abi>>* exp);
379template <class Abi> ldoublev<Abi> frexp(ldoublev<Abi> value, samesize<int, ldoublev<Abi>>* exp);
380
381template <class Abi> samesize<int, floatv<Abi>> ilogb(floatv<Abi> x);
382template <class Abi> samesize<int, doublev<Abi>> ilogb(doublev<Abi> x);
383template <class Abi> samesize<int, ldoublev<Abi>> ilogb(ldoublev<Abi> x);
384
385template <class Abi> floatv<Abi> ldexp(floatv<Abi> x, samesize<int, floatv<Abi>> exp);
386template <class Abi> doublev<Abi> ldexp(doublev<Abi> x, samesize<int, doublev<Abi>> exp);
387template <class Abi> ldoublev<Abi> ldexp(ldoublev<Abi> x, samesize<int, ldoublev<Abi>> exp);
388
389template <class Abi> floatv<Abi> log(floatv<Abi> x);
390template <class Abi> doublev<Abi> log(doublev<Abi> x);
391template <class Abi> ldoublev<Abi> log(ldoublev<Abi> x);
392
393template <class Abi> floatv<Abi> log10(floatv<Abi> x);
394template <class Abi> doublev<Abi> log10(doublev<Abi> x);
395template <class Abi> ldoublev<Abi> log10(ldoublev<Abi> x);
396
397template <class Abi> floatv<Abi> log1p(floatv<Abi> x);
398template <class Abi> doublev<Abi> log1p(doublev<Abi> x);
399template <class Abi> ldoublev<Abi> log1p(ldoublev<Abi> x);
400
401template <class Abi> floatv<Abi> log2(floatv<Abi> x);
402template <class Abi> doublev<Abi> log2(doublev<Abi> x);
403template <class Abi> ldoublev<Abi> log2(ldoublev<Abi> x);
404
405template <class Abi> floatv<Abi> logb(floatv<Abi> x);
406template <class Abi> doublev<Abi> logb(doublev<Abi> x);
407template <class Abi> ldoublev<Abi> logb(ldoublev<Abi> x);
408
409template <class Abi> floatv<Abi> modf(floatv<Abi> value, floatv<Abi>* iptr);
410template <class Abi> doublev<Abi> modf(doublev<Abi> value, doublev<Abi>* iptr);
411template <class Abi> ldoublev<Abi> modf(ldoublev<Abi> value, ldoublev<Abi>* iptr);
412
413template <class Abi> floatv<Abi> scalbn(floatv<Abi> x, samesize<int, floatv<Abi>> n);
414template <class Abi> doublev<Abi> scalbn(doublev<Abi> x, samesize<int, doublev<Abi>> n);
415template <class Abi> ldoublev<Abi> scalbn(ldoublev<Abi> x, samesize<int, ldoublev<Abi>> n);
416template <class Abi> floatv<Abi> scalbln(floatv<Abi> x, samesize<long int, floatv<Abi>> n);
417template <class Abi> doublev<Abi> scalbln(doublev<Abi> x, samesize<long int, doublev<Abi>> n);
418template <class Abi> ldoublev<Abi> scalbln(ldoublev<Abi> x, samesize<long int, ldoublev<Abi>> n);
419
420template <class Abi> floatv<Abi> cbrt(floatv<Abi> x);
421template <class Abi> doublev<Abi> cbrt(doublev<Abi> x);
422template <class Abi> ldoublev<Abi> cbrt(ldoublev<Abi> x);
423
424template <class Abi> scharv<Abi> abs(scharv<Abi> j);
425template <class Abi> shortv<Abi> abs(shortv<Abi> j);
426template <class Abi> intv<Abi> abs(intv<Abi> j);
427template <class Abi> longv<Abi> abs(longv<Abi> j);
428template <class Abi> llongv<Abi> abs(llongv<Abi> j);
429template <class Abi> floatv<Abi> abs(floatv<Abi> j);
430template <class Abi> doublev<Abi> abs(doublev<Abi> j);
431template <class Abi> ldoublev<Abi> abs(ldoublev<Abi> j);
432
433template <class Abi> floatv<Abi> hypot(floatv<Abi> x, floatv<Abi> y);
434template <class Abi> doublev<Abi> hypot(doublev<Abi> x, doublev<Abi> y);
435template <class Abi> ldoublev<Abi> hypot(ldoublev<Abi> x, ldoublev<Abi> y);
436template <class Abi> floatv<Abi> hypot(floatv<Abi> x, floatv<Abi> y, floatv<Abi> z);
437template <class Abi> doublev<Abi> hypot(doublev<Abi> x, doublev<Abi> y, doublev<Abi> z);
438template <class Abi> ldoublev<Abi> hypot(ldoublev<Abi> x, ldoublev<Abi> y, ldoublev<Abi> z);
439
440template <class Abi> floatv<Abi> pow(floatv<Abi> x, floatv<Abi> y);
441template <class Abi> doublev<Abi> pow(doublev<Abi> x, doublev<Abi> y);
442template <class Abi> ldoublev<Abi> pow(ldoublev<Abi> x, ldoublev<Abi> y);
443
444template <class Abi> floatv<Abi> sqrt(floatv<Abi> x);
445template <class Abi> doublev<Abi> sqrt(doublev<Abi> x);
446template <class Abi> ldoublev<Abi> sqrt(ldoublev<Abi> x);
447
448template <class Abi> floatv<Abi> erf(floatv<Abi> x);
449template <class Abi> doublev<Abi> erf(doublev<Abi> x);
450template <class Abi> ldoublev<Abi> erf(ldoublev<Abi> x);
451template <class Abi> floatv<Abi> erfc(floatv<Abi> x);
452template <class Abi> doublev<Abi> erfc(doublev<Abi> x);
453template <class Abi> ldoublev<Abi> erfc(ldoublev<Abi> x);
454
455template <class Abi> floatv<Abi> lgamma(floatv<Abi> x);
456template <class Abi> doublev<Abi> lgamma(doublev<Abi> x);
457template <class Abi> ldoublev<Abi> lgamma(ldoublev<Abi> x);
458
459template <class Abi> floatv<Abi> tgamma(floatv<Abi> x);
460template <class Abi> doublev<Abi> tgamma(doublev<Abi> x);
461template <class Abi> ldoublev<Abi> tgamma(ldoublev<Abi> x);
462
463template <class Abi> floatv<Abi> ceil(floatv<Abi> x);
464template <class Abi> doublev<Abi> ceil(doublev<Abi> x);
465template <class Abi> ldoublev<Abi> ceil(ldoublev<Abi> x);
466
467template <class Abi> floatv<Abi> floor(floatv<Abi> x);
468template <class Abi> doublev<Abi> floor(doublev<Abi> x);
469template <class Abi> ldoublev<Abi> floor(ldoublev<Abi> x);
470
471template <class Abi> floatv<Abi> nearbyint(floatv<Abi> x);
472template <class Abi> doublev<Abi> nearbyint(doublev<Abi> x);
473template <class Abi> ldoublev<Abi> nearbyint(ldoublev<Abi> x);
474
475template <class Abi> floatv<Abi> rint(floatv<Abi> x);
476template <class Abi> doublev<Abi> rint(doublev<Abi> x);
477template <class Abi> ldoublev<Abi> rint(ldoublev<Abi> x);
478
479template <class Abi> samesize<long int, floatv<Abi>> lrint(floatv<Abi> x);
480template <class Abi> samesize<long int, doublev<Abi>> lrint(doublev<Abi> x);
481template <class Abi> samesize<long int, ldoublev<Abi>> lrint(ldoublev<Abi> x);
482template <class Abi> samesize<long long int, floatv<Abi>> llrint(floatv<Abi> x);
483template <class Abi> samesize<long long int, doublev<Abi>> llrint(doublev<Abi> x);
484template <class Abi> samesize<long long int, ldoublev<Abi>> llrint(ldoublev<Abi> x);
485
486template <class Abi> floatv<Abi> round(floatv<Abi> x);
487template <class Abi> doublev<Abi> round(doublev<Abi> x);
488template <class Abi> ldoublev<Abi> round(ldoublev<Abi> x);
489template <class Abi> samesize<long int, floatv<Abi>> lround(floatv<Abi> x);
490template <class Abi> samesize<long int, doublev<Abi>> lround(doublev<Abi> x);
491template <class Abi> samesize<long int, ldoublev<Abi>> lround(ldoublev<Abi> x);
492template <class Abi> samesize<long long int, floatv<Abi>> llround(floatv<Abi> x);
493template <class Abi> samesize<long long int, doublev<Abi>> llround(doublev<Abi> x);
494template <class Abi> samesize<long long int, ldoublev<Abi>> llround(ldoublev<Abi> x);
495
496template <class Abi> floatv<Abi> trunc(floatv<Abi> x);
497template <class Abi> doublev<Abi> trunc(doublev<Abi> x);
498template <class Abi> ldoublev<Abi> trunc(ldoublev<Abi> x);
499
500template <class Abi> floatv<Abi> fmod(floatv<Abi> x, floatv<Abi> y);
501template <class Abi> doublev<Abi> fmod(doublev<Abi> x, doublev<Abi> y);
502template <class Abi> ldoublev<Abi> fmod(ldoublev<Abi> x, ldoublev<Abi> y);
503
504template <class Abi> floatv<Abi> remainder(floatv<Abi> x, floatv<Abi> y);
505template <class Abi> doublev<Abi> remainder(doublev<Abi> x, doublev<Abi> y);
506template <class Abi> ldoublev<Abi> remainder(ldoublev<Abi> x, ldoublev<Abi> y);
507
508template <class Abi> floatv<Abi> remquo(floatv<Abi> x, floatv<Abi> y, samesize<int, floatv<Abi>>* quo);
509template <class Abi> doublev<Abi> remquo(doublev<Abi> x, doublev<Abi> y, samesize<int, doublev<Abi>>* quo);
510template <class Abi> ldoublev<Abi> remquo(ldoublev<Abi> x, ldoublev<Abi> y, samesize<int, ldoublev<Abi>>* quo);
511
512template <class Abi> floatv<Abi> copysign(floatv<Abi> x, floatv<Abi> y);
513template <class Abi> doublev<Abi> copysign(doublev<Abi> x, doublev<Abi> y);
514template <class Abi> ldoublev<Abi> copysign(ldoublev<Abi> x, ldoublev<Abi> y);
515
516template <class Abi> doublev<Abi> nan(const char* tagp);
517template <class Abi> floatv<Abi> nanf(const char* tagp);
518template <class Abi> ldoublev<Abi> nanl(const char* tagp);
519
520template <class Abi> floatv<Abi> nextafter(floatv<Abi> x, floatv<Abi> y);
521template <class Abi> doublev<Abi> nextafter(doublev<Abi> x, doublev<Abi> y);
522template <class Abi> ldoublev<Abi> nextafter(ldoublev<Abi> x, ldoublev<Abi> y);
523
524template <class Abi> floatv<Abi> nexttoward(floatv<Abi> x, ldoublev<Abi> y);
525template <class Abi> doublev<Abi> nexttoward(doublev<Abi> x, ldoublev<Abi> y);
526template <class Abi> ldoublev<Abi> nexttoward(ldoublev<Abi> x, ldoublev<Abi> y);
527
528template <class Abi> floatv<Abi> fdim(floatv<Abi> x, floatv<Abi> y);
529template <class Abi> doublev<Abi> fdim(doublev<Abi> x, doublev<Abi> y);
530template <class Abi> ldoublev<Abi> fdim(ldoublev<Abi> x, ldoublev<Abi> y);
531
532template <class Abi> floatv<Abi> fmax(floatv<Abi> x, floatv<Abi> y);
533template <class Abi> doublev<Abi> fmax(doublev<Abi> x, doublev<Abi> y);
534template <class Abi> ldoublev<Abi> fmax(ldoublev<Abi> x, ldoublev<Abi> y);
535
536template <class Abi> floatv<Abi> fmin(floatv<Abi> x, floatv<Abi> y);
537template <class Abi> doublev<Abi> fmin(doublev<Abi> x, doublev<Abi> y);
538template <class Abi> ldoublev<Abi> fmin(ldoublev<Abi> x, ldoublev<Abi> y);
539
540template <class Abi> floatv<Abi> fma(floatv<Abi> x, floatv<Abi> y, floatv<Abi> z);
541template <class Abi> doublev<Abi> fma(doublev<Abi> x, doublev<Abi> y, doublev<Abi> z);
542template <class Abi> ldoublev<Abi> fma(ldoublev<Abi> x, ldoublev<Abi> y, ldoublev<Abi> z);
543
544template <class Abi> samesize<int, floatv<Abi>> fpclassify(floatv<Abi> x);
545template <class Abi> samesize<int, doublev<Abi>> fpclassify(doublev<Abi> x);
546template <class Abi> samesize<int, ldoublev<Abi>> fpclassify(ldoublev<Abi> x);
547
548template <class Abi> simd_mask<float, Abi> isfinite(floatv<Abi> x);
549template <class Abi> simd_mask<double, Abi> isfinite(doublev<Abi> x);
550template <class Abi> simd_mask<long double, Abi> isfinite(ldoublev<Abi> x);
551
552template <class Abi> simd_mask<float, Abi> isinf(floatv<Abi> x);
553template <class Abi> simd_mask<double, Abi> isinf(doublev<Abi> x);
554template <class Abi> simd_mask<long double, Abi> isinf(ldoublev<Abi> x);
555
556template <class Abi> simd_mask<float, Abi> isnan(floatv<Abi> x);
557template <class Abi> simd_mask<double, Abi> isnan(doublev<Abi> x);
558template <class Abi> simd_mask<long double, Abi> isnan(ldoublev<Abi> x);
559
560template <class Abi> simd_mask<float, Abi> isnormal(floatv<Abi> x);
561template <class Abi> simd_mask<double, Abi> isnormal(doublev<Abi> x);
562template <class Abi> simd_mask<long double, Abi> isnormal(ldoublev<Abi> x);
563
564template <class Abi> simd_mask<float, Abi> signbit(floatv<Abi> x);
565template <class Abi> simd_mask<double, Abi> signbit(doublev<Abi> x);
566template <class Abi> simd_mask<long double, Abi> signbit(ldoublev<Abi> x);
567
568template <class Abi> simd_mask<float, Abi> isgreater(floatv<Abi> x, floatv<Abi> y);
569template <class Abi> simd_mask<double, Abi> isgreater(doublev<Abi> x, doublev<Abi> y);
570template <class Abi> simd_mask<long double, Abi> isgreater(ldoublev<Abi> x, ldoublev<Abi> y);
571
572template <class Abi> simd_mask<float, Abi> isgreaterequal(floatv<Abi> x, floatv<Abi> y);
573template <class Abi> simd_mask<double, Abi> isgreaterequal(doublev<Abi> x, doublev<Abi> y);
574template <class Abi> simd_mask<long double, Abi> isgreaterequal(ldoublev<Abi> x, ldoublev<Abi> y);
575
576template <class Abi> simd_mask<float, Abi> isless(floatv<Abi> x, floatv<Abi> y);
577template <class Abi> simd_mask<double, Abi> isless(doublev<Abi> x, doublev<Abi> y);
578template <class Abi> simd_mask<long double, Abi> isless(ldoublev<Abi> x, ldoublev<Abi> y);
579
580template <class Abi> simd_mask<float, Abi> islessequal(floatv<Abi> x, floatv<Abi> y);
581template <class Abi> simd_mask<double, Abi> islessequal(doublev<Abi> x, doublev<Abi> y);
582template <class Abi> simd_mask<long double, Abi> islessequal(ldoublev<Abi> x, ldoublev<Abi> y);
583
584template <class Abi> simd_mask<float, Abi> islessgreater(floatv<Abi> x, floatv<Abi> y);
585template <class Abi> simd_mask<double, Abi> islessgreater(doublev<Abi> x, doublev<Abi> y);
586template <class Abi> simd_mask<long double, Abi> islessgreater(ldoublev<Abi> x, ldoublev<Abi> y);
587
588template <class Abi> simd_mask<float, Abi> isunordered(floatv<Abi> x, floatv<Abi> y);
589template <class Abi> simd_mask<double, Abi> isunordered(doublev<Abi> x, doublev<Abi> y);
590template <class Abi> simd_mask<long double, Abi> isunordered(ldoublev<Abi> x, ldoublev<Abi> y);
591
592template <class V> struct simd_div_t { V quot, rem; };
593template <class Abi> simd_div_t<scharv<Abi>> div(scharv<Abi> numer, scharv<Abi> denom);
594template <class Abi> simd_div_t<shortv<Abi>> div(shortv<Abi> numer, shortv<Abi> denom);
595template <class Abi> simd_div_t<intv<Abi>> div(intv<Abi> numer, intv<Abi> denom);
596template <class Abi> simd_div_t<longv<Abi>> div(longv<Abi> numer, longv<Abi> denom);
597template <class Abi> simd_div_t<llongv<Abi>> div(llongv<Abi> numer, llongv<Abi> denom);
598
599// [simd.mask.class]
600template <class T, class Abi>
601class simd_mask {
602public:
603 using value_type = bool;
604 using reference = see below;
605 using simd_type = simd<T, Abi>;
606 using abi_type = Abi;
607 static constexpr size_t size() noexcept;
608 simd_mask() = default;
609
610 // broadcast constructor
611 explicit simd_mask(value_type) noexcept;
612
613 // implicit type conversion constructor
614 template <class U> simd_mask(const simd_mask<U, simd_abi::fixed_size<size()>>&) noexcept;
615
616 // load constructor
617 template <class Flags> simd_mask(const value_type* mem, Flags);
618
619 // loads [simd.mask.copy]
620 template <class Flags> void copy_from(const value_type* mem, Flags);
621 template <class Flags> void copy_to(value_type* mem, Flags) const;
622
623 // scalar access [simd.mask.subscr]
624 reference operator[](size_t);
625 value_type operator[](size_t) const;
626
627 // unary operators [simd.mask.unary]
628 simd_mask operator!() const noexcept;
629
630 // simd_mask binary operators [simd.mask.binary]
631 friend simd_mask operator&&(const simd_mask&, const simd_mask&) noexcept;
632 friend simd_mask operator||(const simd_mask&, const simd_mask&) noexcept;
633 friend simd_mask operator& (const simd_mask&, const simd_mask&) noexcept;
634 friend simd_mask operator| (const simd_mask&, const simd_mask&) noexcept;
635 friend simd_mask operator^ (const simd_mask&, const simd_mask&) noexcept;
636
637 // simd_mask compound assignment [simd.mask.cassign]
638 friend simd_mask& operator&=(simd_mask&, const simd_mask&) noexcept;
639 friend simd_mask& operator|=(simd_mask&, const simd_mask&) noexcept;
640 friend simd_mask& operator^=(simd_mask&, const simd_mask&) noexcept;
641
642 // simd_mask compares [simd.mask.comparison]
643 friend simd_mask operator==(const simd_mask&, const simd_mask&) noexcept;
644 friend simd_mask operator!=(const simd_mask&, const simd_mask&) noexcept;
645};
646
647} // parallelism_v2
648} // std::experimental
649
650*/
651
Tim Shend87ea292018-07-30 22:27:38 +0000652#include <algorithm>
Tim Shen158e51b2018-04-23 21:54:06 +0000653#include <array>
654#include <cstddef>
Arthur O'Dwyer65077c02022-01-07 09:45:05 -0500655#include <experimental/__config>
Tim Shen158e51b2018-04-23 21:54:06 +0000656#include <functional>
657
658#if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER)
Arthur O'Dwyer6eeaa002022-02-01 20:16:40 -0500659# pragma GCC system_header
Tim Shen158e51b2018-04-23 21:54:06 +0000660#endif
661
Arthur O'Dwyer2422fa22020-12-02 18:55:01 -0500662_LIBCPP_PUSH_MACROS
663#include <__undef_macros>
664
Tim Shen158e51b2018-04-23 21:54:06 +0000665_LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL_SIMD
666
Tim Shend87ea292018-07-30 22:27:38 +0000667#if _LIBCPP_STD_VER >= 17
668
// Selects how the elements of a simd / simd_mask object are held by
// __simd_storage.
enum class _StorageKind {
  _Scalar = 0, // one element stored directly
  _Array = 1,  // elements stored in a std::array
  _VecExt = 2, // elements stored in a compiler vector-extension type
};
674
675template <_StorageKind __kind, int _Np>
676struct __simd_abi {};
677
// Primary template: deliberately empty. The usable storage layouts are
// provided by the partial specializations on the ABI tag.
template <class _ElementType, class _AbiTag>
class __simd_storage {
};
Tim Shen158e51b2018-04-23 21:54:06 +0000680
681template <class _Tp, int __num_element>
Tim Shend87ea292018-07-30 22:27:38 +0000682class __simd_storage<_Tp, __simd_abi<_StorageKind::_Array, __num_element>> {
683 std::array<_Tp, __num_element> __storage_;
684
685 template <class, class>
686 friend struct simd;
687
688 template <class, class>
689 friend struct simd_mask;
690
691public:
Nikolas Klauser2ef542d2022-01-13 00:07:01 +0100692 _Tp __get(size_t __index) const noexcept { return __storage_[__index]; }
Tim Shend87ea292018-07-30 22:27:38 +0000693 void __set(size_t __index, _Tp __val) noexcept {
694 __storage_[__index] = __val;
695 }
Tim Shen158e51b2018-04-23 21:54:06 +0000696};
697
698template <class _Tp>
Tim Shend87ea292018-07-30 22:27:38 +0000699class __simd_storage<_Tp, __simd_abi<_StorageKind::_Scalar, 1>> {
700 _Tp __storage_;
701
702 template <class, class>
703 friend struct simd;
704
705 template <class, class>
706 friend struct simd_mask;
707
708public:
Nikolas Klauser2ef542d2022-01-13 00:07:01 +0100709 _Tp __get(size_t __index) const noexcept { return (&__storage_)[__index]; }
Tim Shend87ea292018-07-30 22:27:38 +0000710 void __set(size_t __index, _Tp __val) noexcept {
711 (&__storage_)[__index] = __val;
712 }
713};
714
715#ifndef _LIBCPP_HAS_NO_VECTOR_EXTENSION
716
// Returns the largest power of two that does not exceed __val (0 for 0).
// Works by repeatedly clearing the lowest set bit until one bit is left.
constexpr size_t __floor_pow_of_2(size_t __val) {
  size_t __without_lowest_bit = (__val - 1) & __val;
  while (__without_lowest_bit != 0) {
    __val = __without_lowest_bit;
    __without_lowest_bit = (__val - 1) & __val;
  }
  return __val;
}
721
// For __val >= 1, returns the smallest power of two that is not less than
// __val. Computed as twice the largest power of two <= (__val - 1), with
// __val == 1 handled separately.
constexpr size_t __ceil_pow_of_2(size_t __val) {
  if (__val == 1) {
    return 1;
  }
  // Reduce (__val - 1) to its highest set bit by clearing lower bits.
  size_t __high_bit = __val - 1;
  while ((__high_bit & (__high_bit - 1)) != 0) {
    __high_bit &= __high_bit - 1;
  }
  return __high_bit << 1;
}
725
// Maps an element type and a total byte size to a vector-extension type.
// On compilers that are not Clang-based, `type` is a vector_size vector whose
// byte size is __ceil_pow_of_2(__bytes). On Clang-based compilers the primary
// template has no `type` member; it is supplied only by explicit
// specializations.
template <class _Tp, size_t __bytes>
struct __vec_ext_traits {
#if !defined(_LIBCPP_COMPILER_CLANG_BASED)
  typedef _Tp type __attribute__((vector_size(__ceil_pow_of_2(__bytes))));
#endif
};
732
Marek Kurdejf3197922021-04-01 08:29:55 +0200733#if defined(_LIBCPP_COMPILER_CLANG_BASED)
// Defines the __vec_ext_traits specialization for _NUM_ELEMENT elements of
// _TYPE: `type` is a vector_size vector of exactly
// sizeof(_TYPE) * _NUM_ELEMENT bytes. The expansion has no trailing
// semicolon; the caller supplies it.
#define _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, _NUM_ELEMENT)                        \
  template <>                                                                  \
  struct __vec_ext_traits<_TYPE, sizeof(_TYPE) * _NUM_ELEMENT> {               \
    using type =                                                               \
        _TYPE __attribute__((vector_size(sizeof(_TYPE) * _NUM_ELEMENT)));      \
  }
740
// Instantiates _LIBCPP_SPECIALIZE_VEC_EXT for every element count from 1 to
// 32 for the given element type.
#define _LIBCPP_SPECIALIZE_VEC_EXT_32(_TYPE)                                   \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 1);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 2);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 3);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 4);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 5);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 6);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 7);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 8);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 9);                                        \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 10);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 11);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 12);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 13);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 14);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 15);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 16);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 17);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 18);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 19);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 20);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 21);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 22);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 23);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 24);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 25);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 26);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 27);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 28);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 29);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 30);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 31);                                       \
  _LIBCPP_SPECIALIZE_VEC_EXT(_TYPE, 32)
Tim Shend87ea292018-07-30 22:27:38 +0000774
775_LIBCPP_SPECIALIZE_VEC_EXT_32(char);
776_LIBCPP_SPECIALIZE_VEC_EXT_32(char16_t);
777_LIBCPP_SPECIALIZE_VEC_EXT_32(char32_t);
778_LIBCPP_SPECIALIZE_VEC_EXT_32(wchar_t);
779_LIBCPP_SPECIALIZE_VEC_EXT_32(signed char);
780_LIBCPP_SPECIALIZE_VEC_EXT_32(signed short);
781_LIBCPP_SPECIALIZE_VEC_EXT_32(signed int);
782_LIBCPP_SPECIALIZE_VEC_EXT_32(signed long);
783_LIBCPP_SPECIALIZE_VEC_EXT_32(signed long long);
784_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned char);
785_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned short);
786_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned int);
787_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned long);
788_LIBCPP_SPECIALIZE_VEC_EXT_32(unsigned long long);
789_LIBCPP_SPECIALIZE_VEC_EXT_32(float);
790_LIBCPP_SPECIALIZE_VEC_EXT_32(double);
791_LIBCPP_SPECIALIZE_VEC_EXT_32(long double);
792
793#undef _LIBCPP_SPECIALIZE_VEC_EXT_32
794#undef _LIBCPP_SPECIALIZE_VEC_EXT
795#endif
796
797template <class _Tp, int __num_element>
798class __simd_storage<_Tp, __simd_abi<_StorageKind::_VecExt, __num_element>> {
799 using _StorageType =
800 typename __vec_ext_traits<_Tp, sizeof(_Tp) * __num_element>::type;
801
802 _StorageType __storage_;
803
804 template <class, class>
805 friend struct simd;
806
807 template <class, class>
808 friend struct simd_mask;
809
810public:
Nikolas Klauser2ef542d2022-01-13 00:07:01 +0100811 _Tp __get(size_t __index) const noexcept { return __storage_[__index]; }
Tim Shend87ea292018-07-30 22:27:38 +0000812 void __set(size_t __index, _Tp __val) noexcept {
813 __storage_[__index] = __val;
814 }
815};
816
817#endif // _LIBCPP_HAS_NO_VECTOR_EXTENSION
818
819template <class _Vp, class _Tp, class _Abi>
820class __simd_reference {
821 static_assert(std::is_same<_Vp, _Tp>::value, "");
822
823 template <class, class>
824 friend struct simd;
825
826 template <class, class>
827 friend struct simd_mask;
828
829 __simd_storage<_Tp, _Abi>* __ptr_;
830 size_t __index_;
831
832 __simd_reference(__simd_storage<_Tp, _Abi>* __ptr, size_t __index)
833 : __ptr_(__ptr), __index_(__index) {}
834
835 __simd_reference(const __simd_reference&) = default;
836
837public:
838 __simd_reference() = delete;
839 __simd_reference& operator=(const __simd_reference&) = delete;
840
841 operator _Vp() const { return __ptr_->__get(__index_); }
842
843 __simd_reference operator=(_Vp __value) && {
844 __ptr_->__set(__index_, __value);
845 return *this;
846 }
847
848 __simd_reference operator++() && {
849 return std::move(*this) = __ptr_->__get(__index_) + 1;
850 }
851
852 _Vp operator++(int) && {
853 auto __val = __ptr_->__get(__index_);
854 __ptr_->__set(__index_, __val + 1);
855 return __val;
856 }
857
858 __simd_reference operator--() && {
859 return std::move(*this) = __ptr_->__get(__index_) - 1;
860 }
861
862 _Vp operator--(int) && {
863 auto __val = __ptr_->__get(__index_);
864 __ptr_->__set(__index_, __val - 1);
865 return __val;
866 }
867
868 __simd_reference operator+=(_Vp __value) && {
869 return std::move(*this) = __ptr_->__get(__index_) + __value;
870 }
871
872 __simd_reference operator-=(_Vp __value) && {
873 return std::move(*this) = __ptr_->__get(__index_) - __value;
874 }
875
876 __simd_reference operator*=(_Vp __value) && {
877 return std::move(*this) = __ptr_->__get(__index_) * __value;
878 }
879
880 __simd_reference operator/=(_Vp __value) && {
881 return std::move(*this) = __ptr_->__get(__index_) / __value;
882 }
883
884 __simd_reference operator%=(_Vp __value) && {
885 return std::move(*this) = __ptr_->__get(__index_) % __value;
886 }
887
888 __simd_reference operator>>=(_Vp __value) && {
889 return std::move(*this) = __ptr_->__get(__index_) >> __value;
890 }
891
892 __simd_reference operator<<=(_Vp __value) && {
893 return std::move(*this) = __ptr_->__get(__index_) << __value;
894 }
895
896 __simd_reference operator&=(_Vp __value) && {
897 return std::move(*this) = __ptr_->__get(__index_) & __value;
898 }
899
900 __simd_reference operator|=(_Vp __value) && {
901 return std::move(*this) = __ptr_->__get(__index_) | __value;
902 }
903
904 __simd_reference operator^=(_Vp __value) && {
905 return std::move(*this) = __ptr_->__get(__index_) ^ __value;
906 }
Tim Shen158e51b2018-04-23 21:54:06 +0000907};
908
// Preferred overload: only viable when list-initializing a _To from a _From
// is well-formed, i.e. the conversion is not narrowing.
template <class _To, class _From>
constexpr auto __is_non_narrowing_convertible_impl(_From)
    -> decltype(_To{std::declval<_From>()}, true) {
  return true;
}

// Fallback overload, selected when the overload above is removed by SFINAE.
template <class _To>
constexpr bool __is_non_narrowing_convertible_impl(...) {
  return false;
}

// True only when both types are arithmetic and converting _From to _To is
// not a narrowing conversion; false for every other pair of types.
template <class _From, class _To>
constexpr bool __is_non_narrowing_arithmetic_convertible() {
  if constexpr (std::is_arithmetic_v<_To> && std::is_arithmetic_v<_From>) {
    return __is_non_narrowing_convertible_impl<_To>(_From{});
  } else {
    return false;
  }
}
935
// Base case: the sum of no operands is a value-initialized _Tp.
template <class _Tp>
constexpr _Tp __variadic_sum() {
  return _Tp{};
}

// Recursive case: converts the first operand to _Tp and adds it to the sum
// of the remaining operands. The result is converted back to _Tp at every
// level, so with _Tp = bool the sum behaves like a logical OR.
template <class _Tp, class _Up, class... _Args>
constexpr _Tp __variadic_sum(_Up __first, _Args... __rest) {
  const _Tp __head = static_cast<_Tp>(__first);
  const _Tp __tail = __variadic_sum<_Tp>(__rest...);
  return __head + __tail;
}
945
// Identity wrapper: `typename __nodeduce<T>::type` is T, but written this way
// the template parameter sits in a non-deduced context.
template <class _Tp>
struct __nodeduce {
  typedef _Tp type;
};
950
// True for arithmetic types other than bool that carry no const or volatile
// qualifier.
template <class _Tp>
constexpr bool __vectorizable() {
  using _Unqualified = typename std::remove_cv<_Tp>::type;
  return std::is_same<_Tp, _Unqualified>::value &&
         std::is_arithmetic<_Tp>::value && !std::is_same<_Tp, bool>::value;
}
956
Tim Shen158e51b2018-04-23 21:54:06 +0000957_LIBCPP_END_NAMESPACE_EXPERIMENTAL_SIMD
958_LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL_SIMD_ABI
959
// ABI tag for a single element stored directly.
using scalar = __simd_abi<_StorageKind::_Scalar, 1>;

// ABI tag for _Np elements stored in an array.
template <int _Np>
using fixed_size = __simd_abi<_StorageKind::_Array, _Np>;
964
// Largest element count for fixed_size. Declared as `int`, matching both the
// synopsis at the top of this header and the `int` parameter of fixed_size.
template <class _Tp>
inline constexpr int max_fixed_size = 32;
Tim Shend87ea292018-07-30 22:27:38 +0000967
// Default ABI tag for _Tp: a fixed_size tag with 16 / sizeof(_Tp) elements.
template <class _Tp>
using compatible = fixed_size<16 / sizeof(_Tp)>;
Tim Shend87ea292018-07-30 22:27:38 +0000970
971#ifndef _LIBCPP_HAS_NO_VECTOR_EXTENSION
Tim Shen158e51b2018-04-23 21:54:06 +0000972template <class _Tp>
Tim Shend87ea292018-07-30 22:27:38 +0000973using native = __simd_abi<_StorageKind::_VecExt,
974 _LIBCPP_NATIVE_SIMD_WIDTH_IN_BYTES / sizeof(_Tp)>;
975#else
976template <class _Tp>
977using native =
978 fixed_size<_Tp, _LIBCPP_NATIVE_SIMD_WIDTH_IN_BYTES / sizeof(_Tp)>;
979#endif // _LIBCPP_HAS_NO_VECTOR_EXTENSION
Tim Shen158e51b2018-04-23 21:54:06 +0000980
981_LIBCPP_END_NAMESPACE_EXPERIMENTAL_SIMD_ABI
982_LIBCPP_BEGIN_NAMESPACE_EXPERIMENTAL_SIMD
983
984template <class _Tp, class _Abi = simd_abi::compatible<_Tp>>
985class simd;
986template <class _Tp, class _Abi = simd_abi::compatible<_Tp>>
987class simd_mask;
988
// Flag types accepted by the load / store members, and one constant of each.
struct element_aligned_tag {
};
struct vector_aligned_tag {
};
template <size_t _Alignment>
struct overaligned_tag {
};

inline constexpr element_aligned_tag element_aligned = {};
inline constexpr vector_aligned_tag vector_aligned = {};
template <size_t _Alignment>
inline constexpr overaligned_tag<_Alignment> overaligned = {};
Tim Shen158e51b2018-04-23 21:54:06 +0000997
998// traits [simd.traits]
999template <class _Tp>
1000struct is_abi_tag : std::integral_constant<bool, false> {};
1001
1002template <_StorageKind __kind, int _Np>
1003struct is_abi_tag<__simd_abi<__kind, _Np>>
1004 : std::integral_constant<bool, true> {};
1005
1006template <class _Tp>
1007struct is_simd : std::integral_constant<bool, false> {};
1008
1009template <class _Tp, class _Abi>
1010struct is_simd<simd<_Tp, _Abi>> : std::integral_constant<bool, true> {};
1011
1012template <class _Tp>
1013struct is_simd_mask : std::integral_constant<bool, false> {};
1014
1015template <class _Tp, class _Abi>
1016struct is_simd_mask<simd_mask<_Tp, _Abi>> : std::integral_constant<bool, true> {
1017};
1018
1019template <class _Tp>
1020struct is_simd_flag_type : std::integral_constant<bool, false> {};
1021
1022template <>
1023struct is_simd_flag_type<element_aligned_tag>
1024 : std::integral_constant<bool, true> {};
1025
1026template <>
1027struct is_simd_flag_type<vector_aligned_tag>
1028 : std::integral_constant<bool, true> {};
1029
1030template <size_t _Align>
1031struct is_simd_flag_type<overaligned_tag<_Align>>
1032 : std::integral_constant<bool, true> {};
1033
// Variable-template shorthands for the ::value member of the traits above.
template <class _Tp>
inline constexpr bool is_abi_tag_v = is_abi_tag<_Tp>::value;
template <class _Tp>
inline constexpr bool is_simd_v = is_simd<_Tp>::value;
template <class _Tp>
inline constexpr bool is_simd_mask_v = is_simd_mask<_Tp>::value;
template <class _Tp>
inline constexpr bool is_simd_flag_type_v = is_simd_flag_type<_Tp>::value;
Tim Shen158e51b2018-04-23 21:54:06 +00001042template <class _Tp, size_t _Np>
1043struct abi_for_size {
1044 using type = simd_abi::fixed_size<_Np>;
1045};
1046template <class _Tp, size_t _Np>
1047using abi_for_size_t = typename abi_for_size<_Tp, _Np>::type;
1048
1049template <class _Tp, class _Abi = simd_abi::compatible<_Tp>>
1050struct simd_size;
1051
1052template <class _Tp, _StorageKind __kind, int _Np>
1053struct simd_size<_Tp, __simd_abi<__kind, _Np>>
1054 : std::integral_constant<size_t, _Np> {
1055 static_assert(
1056 std::is_arithmetic<_Tp>::value &&
1057 !std::is_same<typename std::remove_const<_Tp>::type, bool>::value,
1058 "Element type should be vectorizable");
1059};
1060
// TODO: implement memory_alignment (only declared so far).
Tim Shen158e51b2018-04-23 21:54:06 +00001062template <class _Tp, class _Up = typename _Tp::value_type>
1063struct memory_alignment;
1064
// Shorthand for simd_size<_Tp, _Abi>::value.
template <class _Tp, class _Abi = simd_abi::compatible<_Tp>>
inline constexpr size_t simd_size_v = simd_size<_Tp, _Abi>::value;

// Shorthand for memory_alignment<_Tp, _Up>::value.
template <class _Tp, class _Up = typename _Tp::value_type>
inline constexpr size_t memory_alignment_v = memory_alignment<_Tp, _Up>::value;
Tim Shen158e51b2018-04-23 21:54:06 +00001070
1071// class template simd [simd.class]
// simd using the native ABI tag for _Tp.
template <class _Tp>
using native_simd = simd<_Tp, simd_abi::native<_Tp>>;
// simd using the fixed_size ABI tag with _Np elements.
template <class _Tp, int _Np>
using fixed_size_simd = simd<_Tp, simd_abi::fixed_size<_Np>>;

// class template simd_mask [simd.mask.class]
// simd_mask using the native ABI tag for _Tp.
template <class _Tp>
using native_simd_mask = simd_mask<_Tp, simd_abi::native<_Tp>>;

// simd_mask using the fixed_size ABI tag with _Np elements.
template <class _Tp, int _Np>
using fixed_size_simd_mask = simd_mask<_Tp, simd_abi::fixed_size<_Np>>;
1083
1084// casts [simd.casts]
1085template <class _Tp>
1086struct __static_simd_cast_traits {
1087 template <class _Up, class _Abi>
1088 static simd<_Tp, _Abi> __apply(const simd<_Up, _Abi>& __v);
1089};
1090
1091template <class _Tp, class _NewAbi>
1092struct __static_simd_cast_traits<simd<_Tp, _NewAbi>> {
1093 template <class _Up, class _Abi>
1094 static typename std::enable_if<simd<_Up, _Abi>::size() ==
1095 simd<_Tp, _NewAbi>::size(),
1096 simd<_Tp, _NewAbi>>::type
1097 __apply(const simd<_Up, _Abi>& __v);
1098};
1099
1100template <class _Tp>
1101struct __simd_cast_traits {
1102 template <class _Up, class _Abi>
1103 static typename std::enable_if<
1104 __is_non_narrowing_arithmetic_convertible<_Up, _Tp>(),
1105 simd<_Tp, _Abi>>::type
1106 __apply(const simd<_Up, _Abi>& __v);
1107};
1108
1109template <class _Tp, class _NewAbi>
1110struct __simd_cast_traits<simd<_Tp, _NewAbi>> {
1111 template <class _Up, class _Abi>
1112 static typename std::enable_if<
1113 __is_non_narrowing_arithmetic_convertible<_Up, _Tp>() &&
1114 simd<_Up, _Abi>::size() == simd<_Tp, _NewAbi>::size(),
1115 simd<_Tp, _NewAbi>>::type
1116 __apply(const simd<_Up, _Abi>& __v);
1117};
1118
1119template <class _Tp, class _Up, class _Abi>
1120auto simd_cast(const simd<_Up, _Abi>& __v)
1121 -> decltype(__simd_cast_traits<_Tp>::__apply(__v)) {
1122 return __simd_cast_traits<_Tp>::__apply(__v);
1123}
1124
1125template <class _Tp, class _Up, class _Abi>
1126auto static_simd_cast(const simd<_Up, _Abi>& __v)
1127 -> decltype(__static_simd_cast_traits<_Tp>::__apply(__v)) {
1128 return __static_simd_cast_traits<_Tp>::__apply(__v);
1129}
1130
1131template <class _Tp, class _Abi>
1132fixed_size_simd<_Tp, simd_size<_Tp, _Abi>::value>
1133to_fixed_size(const simd<_Tp, _Abi>&) noexcept;
1134
1135template <class _Tp, class _Abi>
1136fixed_size_simd_mask<_Tp, simd_size<_Tp, _Abi>::value>
1137to_fixed_size(const simd_mask<_Tp, _Abi>&) noexcept;
1138
1139template <class _Tp, size_t _Np>
1140native_simd<_Tp> to_native(const fixed_size_simd<_Tp, _Np>&) noexcept;
1141
1142template <class _Tp, size_t _Np>
1143native_simd_mask<_Tp> to_native(const fixed_size_simd_mask<_Tp, _Np>&) noexcept;
1144
1145template <class _Tp, size_t _Np>
1146simd<_Tp> to_compatible(const fixed_size_simd<_Tp, _Np>&) noexcept;
1147
1148template <class _Tp, size_t _Np>
1149simd_mask<_Tp> to_compatible(const fixed_size_simd_mask<_Tp, _Np>&) noexcept;
1150
1151template <size_t... __sizes, class _Tp, class _Abi>
1152tuple<simd<_Tp, abi_for_size_t<_Tp, __sizes>>...> split(const simd<_Tp, _Abi>&);
1153
1154template <size_t... __sizes, class _Tp, class _Abi>
1155tuple<simd_mask<_Tp, abi_for_size_t<_Tp, __sizes>>...>
1156split(const simd_mask<_Tp, _Abi>&);
1157
1158template <class _SimdType, class _Abi>
1159array<_SimdType, simd_size<typename _SimdType::value_type, _Abi>::value /
1160 _SimdType::size()>
1161split(const simd<typename _SimdType::value_type, _Abi>&);
1162
1163template <class _SimdType, class _Abi>
1164array<_SimdType, simd_size<typename _SimdType::value_type, _Abi>::value /
1165 _SimdType::size()>
1166split(const simd_mask<typename _SimdType::value_type, _Abi>&);
1167
1168template <class _Tp, class... _Abis>
1169simd<_Tp, abi_for_size_t<_Tp, __variadic_sum(simd_size<_Tp, _Abis>::value...)>>
1170concat(const simd<_Tp, _Abis>&...);
1171
1172template <class _Tp, class... _Abis>
1173simd_mask<_Tp,
1174 abi_for_size_t<_Tp, __variadic_sum(simd_size<_Tp, _Abis>::value...)>>
1175concat(const simd_mask<_Tp, _Abis>&...);
1176
1177// reductions [simd.mask.reductions]
1178template <class _Tp, class _Abi>
1179bool all_of(const simd_mask<_Tp, _Abi>&) noexcept;
1180template <class _Tp, class _Abi>
1181bool any_of(const simd_mask<_Tp, _Abi>&) noexcept;
1182template <class _Tp, class _Abi>
1183bool none_of(const simd_mask<_Tp, _Abi>&) noexcept;
1184template <class _Tp, class _Abi>
1185bool some_of(const simd_mask<_Tp, _Abi>&) noexcept;
1186template <class _Tp, class _Abi>
1187int popcount(const simd_mask<_Tp, _Abi>&) noexcept;
1188template <class _Tp, class _Abi>
1189int find_first_set(const simd_mask<_Tp, _Abi>&);
1190template <class _Tp, class _Abi>
1191int find_last_set(const simd_mask<_Tp, _Abi>&);
1192bool all_of(bool) noexcept;
1193bool any_of(bool) noexcept;
1194bool none_of(bool) noexcept;
1195bool some_of(bool) noexcept;
1196int popcount(bool) noexcept;
1197int find_first_set(bool) noexcept;
1198int find_last_set(bool) noexcept;
1199
1200// masked assignment [simd.whereexpr]
1201template <class _MaskType, class _Tp>
1202class const_where_expression;
1203template <class _MaskType, class _Tp>
1204class where_expression;
1205
1206// masked assignment [simd.mask.where]
Tim Shen158e51b2018-04-23 21:54:06 +00001207template <class _Tp, class _Abi>
1208where_expression<simd_mask<_Tp, _Abi>, simd<_Tp, _Abi>>
1209where(const typename simd<_Tp, _Abi>::mask_type&, simd<_Tp, _Abi>&) noexcept;
1210
1211template <class _Tp, class _Abi>
1212const_where_expression<simd_mask<_Tp, _Abi>, const simd<_Tp, _Abi>>
1213where(const typename simd<_Tp, _Abi>::mask_type&,
1214 const simd<_Tp, _Abi>&) noexcept;
1215
1216template <class _Tp, class _Abi>
1217where_expression<simd_mask<_Tp, _Abi>, simd_mask<_Tp, _Abi>>
1218where(const typename __nodeduce<simd_mask<_Tp, _Abi>>::type&,
1219 simd_mask<_Tp, _Abi>&) noexcept;
1220
1221template <class _Tp, class _Abi>
1222const_where_expression<simd_mask<_Tp, _Abi>, const simd_mask<_Tp, _Abi>>
1223where(const typename __nodeduce<simd_mask<_Tp, _Abi>>::type&,
1224 const simd_mask<_Tp, _Abi>&) noexcept;
1225
1226template <class _Tp>
1227where_expression<bool, _Tp> where(bool, _Tp&) noexcept;
1228
1229template <class _Tp>
1230const_where_expression<bool, const _Tp> where(bool, const _Tp&) noexcept;
1231
1232// reductions [simd.reductions]
1233template <class _Tp, class _Abi, class _BinaryOp = std::plus<_Tp>>
1234_Tp reduce(const simd<_Tp, _Abi>&, _BinaryOp = _BinaryOp());
1235
1236template <class _MaskType, class _SimdType, class _BinaryOp>
1237typename _SimdType::value_type
1238reduce(const const_where_expression<_MaskType, _SimdType>&,
1239 typename _SimdType::value_type neutral_element, _BinaryOp binary_op);
1240
1241template <class _MaskType, class _SimdType>
1242typename _SimdType::value_type
1243reduce(const const_where_expression<_MaskType, _SimdType>&,
1244 plus<typename _SimdType::value_type> binary_op = {});
1245
1246template <class _MaskType, class _SimdType>
1247typename _SimdType::value_type
1248reduce(const const_where_expression<_MaskType, _SimdType>&,
1249 multiplies<typename _SimdType::value_type> binary_op);
1250
1251template <class _MaskType, class _SimdType>
1252typename _SimdType::value_type
1253reduce(const const_where_expression<_MaskType, _SimdType>&,
1254 bit_and<typename _SimdType::value_type> binary_op);
1255
1256template <class _MaskType, class _SimdType>
1257typename _SimdType::value_type
1258reduce(const const_where_expression<_MaskType, _SimdType>&,
1259 bit_or<typename _SimdType::value_type> binary_op);
1260
1261template <class _MaskType, class _SimdType>
1262typename _SimdType::value_type
1263reduce(const const_where_expression<_MaskType, _SimdType>&,
1264 bit_xor<typename _SimdType::value_type> binary_op);
1265
1266template <class _Tp, class _Abi>
1267_Tp hmin(const simd<_Tp, _Abi>&);
1268template <class _MaskType, class _SimdType>
1269typename _SimdType::value_type
1270hmin(const const_where_expression<_MaskType, _SimdType>&);
1271template <class _Tp, class _Abi>
1272_Tp hmax(const simd<_Tp, _Abi>&);
1273template <class _MaskType, class _SimdType>
1274typename _SimdType::value_type
1275hmax(const const_where_expression<_MaskType, _SimdType>&);
1276
1277// algorithms [simd.alg]
1278template <class _Tp, class _Abi>
1279simd<_Tp, _Abi> min(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&) noexcept;
1280
1281template <class _Tp, class _Abi>
1282simd<_Tp, _Abi> max(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&) noexcept;
1283
1284template <class _Tp, class _Abi>
1285std::pair<simd<_Tp, _Abi>, simd<_Tp, _Abi>>
1286minmax(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&) noexcept;
1287
1288template <class _Tp, class _Abi>
1289simd<_Tp, _Abi> clamp(const simd<_Tp, _Abi>&, const simd<_Tp, _Abi>&,
1290 const simd<_Tp, _Abi>&);
1291
1292// [simd.whereexpr]
// TODO: implement where expressions.
// Interface-only declaration of const_where_expression ([simd.whereexpr]).
// Copying is disabled, and the members are declared here without a
// definition.
template <class _MaskType, class _Tp>
class const_where_expression {
public:
  const_where_expression(const const_where_expression&) = delete;
  const_where_expression& operator=(const const_where_expression&) = delete;
  typename remove_const<_Tp>::type operator-() const&&;
  template <class _Up, class _Flags>
  void copy_to(_Up*, _Flags) const&&;
};
1303
// Interface-only declaration of where_expression ([simd.whereexpr]). It
// derives from const_where_expression and adds the assignment, compound
// assignment, increment/decrement and copy_from members. Copying is
// disabled, and the members are declared here without a definition.
template <class _MaskType, class _Tp>
class where_expression : public const_where_expression<_MaskType, _Tp> {
public:
  where_expression(const where_expression&) = delete;
  where_expression& operator=(const where_expression&) = delete;
  template <class _Up>
  void operator=(_Up&&);
  template <class _Up>
  void operator+=(_Up&&);
  template <class _Up>
  void operator-=(_Up&&);
  template <class _Up>
  void operator*=(_Up&&);
  template <class _Up>
  void operator/=(_Up&&);
  template <class _Up>
  void operator%=(_Up&&);
  template <class _Up>
  void operator&=(_Up&&);
  template <class _Up>
  void operator|=(_Up&&);
  template <class _Up>
  void operator^=(_Up&&);
  template <class _Up>
  void operator<<=(_Up&&);
  template <class _Up>
  void operator>>=(_Up&&);
  void operator++();
  void operator++(int);
  void operator--();
  void operator--(int);
  template <class _Up, class _Flags>
  void copy_from(const _Up*, _Flags);
};
1338
1339// [simd.class]
1340// TODO: implement simd
1341template <class _Tp, class _Abi>
1342class simd {
Tim Shend87ea292018-07-30 22:27:38 +00001343public:
1344 using value_type = _Tp;
1345 using reference = __simd_reference<_Tp, _Tp, _Abi>;
1346 using mask_type = simd_mask<_Tp, _Abi>;
1347 using abi_type = _Abi;
1348
1349 simd() = default;
1350 simd(const simd&) = default;
1351 simd& operator=(const simd&) = default;
1352
1353 static constexpr size_t size() noexcept {
1354 return simd_size<_Tp, _Abi>::value;
1355 }
1356
Tim Shen158e51b2018-04-23 21:54:06 +00001357private:
Tim Shend87ea292018-07-30 22:27:38 +00001358 __simd_storage<_Tp, _Abi> __s_;
1359
Tim Shen158e51b2018-04-23 21:54:06 +00001360 template <class _Up>
1361 static constexpr bool __can_broadcast() {
1362 return (std::is_arithmetic<_Up>::value &&
1363 __is_non_narrowing_arithmetic_convertible<_Up, _Tp>()) ||
1364 (!std::is_arithmetic<_Up>::value &&
1365 std::is_convertible<_Up, _Tp>::value) ||
1366 std::is_same<typename std::remove_const<_Up>::type, int>::value ||
1367 (std::is_same<typename std::remove_const<_Up>::type,
1368 unsigned int>::value &&
1369 std::is_unsigned<_Tp>::value);
1370 }
1371
Tim Shend87ea292018-07-30 22:27:38 +00001372 template <class _Generator, size_t... __indicies>
1373 static constexpr decltype(
1374 std::forward_as_tuple(std::declval<_Generator>()(
1375 std::integral_constant<size_t, __indicies>())...),
1376 bool())
1377 __can_generate(std::index_sequence<__indicies...>) {
1378 return !__variadic_sum<bool>(
1379 !__can_broadcast<decltype(std::declval<_Generator>()(
1380 std::integral_constant<size_t, __indicies>()))>()...);
Tim Shenddc239b2018-07-30 22:21:22 +00001381 }
1382
Tim Shend87ea292018-07-30 22:27:38 +00001383 template <class _Generator>
1384 static bool __can_generate(...) {
1385 return false;
1386 }
Tim Shenddc239b2018-07-30 22:21:22 +00001387
Tim Shend87ea292018-07-30 22:27:38 +00001388 template <class _Generator, size_t... __indicies>
1389 void __generator_init(_Generator&& __g, std::index_sequence<__indicies...>) {
1390 int __not_used[]{((*this)[__indicies] =
1391 __g(std::integral_constant<size_t, __indicies>()),
1392 0)...};
1393 (void)__not_used;
1394 }
1395
1396public:
Tim Shen158e51b2018-04-23 21:54:06 +00001397 // implicit type conversion constructor
1398 template <class _Up,
1399 class = typename std::enable_if<
1400 std::is_same<_Abi, simd_abi::fixed_size<size()>>::value &&
1401 __is_non_narrowing_arithmetic_convertible<_Up, _Tp>()>::type>
Tim Shend87ea292018-07-30 22:27:38 +00001402 simd(const simd<_Up, simd_abi::fixed_size<size()>>& __v) {
1403 for (size_t __i = 0; __i < size(); __i++) {
1404 (*this)[__i] = static_cast<_Tp>(__v[__i]);
1405 }
1406 }
Tim Shen158e51b2018-04-23 21:54:06 +00001407
1408 // implicit broadcast constructor
1409 template <class _Up,
1410 class = typename std::enable_if<__can_broadcast<_Up>()>::type>
Tim Shend87ea292018-07-30 22:27:38 +00001411 simd(_Up&& __rv) {
1412 auto __v = static_cast<_Tp>(__rv);
1413 for (size_t __i = 0; __i < size(); __i++) {
1414 (*this)[__i] = __v;
1415 }
1416 }
Tim Shen158e51b2018-04-23 21:54:06 +00001417
1418 // generator constructor
Tim Shen158e51b2018-04-23 21:54:06 +00001419 template <class _Generator,
Tim Shend87ea292018-07-30 22:27:38 +00001420 int = typename std::enable_if<
1421 __can_generate<_Generator>(std::make_index_sequence<size()>()),
1422 int>::type()>
1423 explicit simd(_Generator&& __g) {
1424 __generator_init(std::forward<_Generator>(__g),
1425 std::make_index_sequence<size()>());
1426 }
Tim Shen158e51b2018-04-23 21:54:06 +00001427
1428 // load constructor
Tim Shend87ea292018-07-30 22:27:38 +00001429 template <
1430 class _Up, class _Flags,
1431 class = typename std::enable_if<__vectorizable<_Up>()>::type,
1432 class = typename std::enable_if<is_simd_flag_type<_Flags>::value>::type>
1433 simd(const _Up* __buffer, _Flags) {
1434 // TODO: optimize for overaligned flags
1435 for (size_t __i = 0; __i < size(); __i++) {
1436 (*this)[__i] = static_cast<_Tp>(__buffer[__i]);
1437 }
1438 }
Tim Shen158e51b2018-04-23 21:54:06 +00001439
1440 // loads [simd.load]
1441 template <class _Up, class _Flags>
Tim Shend87ea292018-07-30 22:27:38 +00001442 typename std::enable_if<__vectorizable<_Up>() &&
1443 is_simd_flag_type<_Flags>::value>::type
1444 copy_from(const _Up* __buffer, _Flags) {
1445 *this = simd(__buffer, _Flags());
1446 }
Tim Shen158e51b2018-04-23 21:54:06 +00001447
1448 // stores [simd.store]
1449 template <class _Up, class _Flags>
Tim Shend87ea292018-07-30 22:27:38 +00001450 typename std::enable_if<__vectorizable<_Up>() &&
1451 is_simd_flag_type<_Flags>::value>::type
1452 copy_to(_Up* __buffer, _Flags) const {
1453 // TODO: optimize for overaligned flags
1454 for (size_t __i = 0; __i < size(); __i++) {
1455 __buffer[__i] = static_cast<_Up>((*this)[__i]);
1456 }
1457 }
Tim Shen158e51b2018-04-23 21:54:06 +00001458
1459 // scalar access [simd.subscr]
Tim Shend87ea292018-07-30 22:27:38 +00001460 reference operator[](size_t __i) { return reference(&__s_, __i); }
1461
1462 value_type operator[](size_t __i) const { return __s_.__get(__i); }
Tim Shen158e51b2018-04-23 21:54:06 +00001463
1464 // unary operators [simd.unary]
1465 simd& operator++();
1466 simd operator++(int);
1467 simd& operator--();
1468 simd operator--(int);
1469 mask_type operator!() const;
1470 simd operator~() const;
1471 simd operator+() const;
1472 simd operator-() const;
1473
1474 // binary operators [simd.binary]
1475 friend simd operator+(const simd&, const simd&);
1476 friend simd operator-(const simd&, const simd&);
1477 friend simd operator*(const simd&, const simd&);
1478 friend simd operator/(const simd&, const simd&);
1479 friend simd operator%(const simd&, const simd&);
1480 friend simd operator&(const simd&, const simd&);
1481 friend simd operator|(const simd&, const simd&);
1482 friend simd operator^(const simd&, const simd&);
1483 friend simd operator<<(const simd&, const simd&);
1484 friend simd operator>>(const simd&, const simd&);
1485 friend simd operator<<(const simd&, int);
1486 friend simd operator>>(const simd&, int);
1487
1488 // compound assignment [simd.cassign]
1489 friend simd& operator+=(simd&, const simd&);
1490 friend simd& operator-=(simd&, const simd&);
1491 friend simd& operator*=(simd&, const simd&);
1492 friend simd& operator/=(simd&, const simd&);
1493 friend simd& operator%=(simd&, const simd&);
1494
1495 friend simd& operator&=(simd&, const simd&);
1496 friend simd& operator|=(simd&, const simd&);
1497 friend simd& operator^=(simd&, const simd&);
1498 friend simd& operator<<=(simd&, const simd&);
1499 friend simd& operator>>=(simd&, const simd&);
1500 friend simd& operator<<=(simd&, int);
1501 friend simd& operator>>=(simd&, int);
1502
1503 // compares [simd.comparison]
1504 friend mask_type operator==(const simd&, const simd&);
1505 friend mask_type operator!=(const simd&, const simd&);
1506 friend mask_type operator>=(const simd&, const simd&);
1507 friend mask_type operator<=(const simd&, const simd&);
1508 friend mask_type operator>(const simd&, const simd&);
1509 friend mask_type operator<(const simd&, const simd&);
1510};
1511
1512// [simd.mask.class]
1513template <class _Tp, class _Abi>
1514// TODO: implement simd_mask
1515class simd_mask {
1516public:
1517 using value_type = bool;
1518 // TODO: this is strawman implementation. Turn it into a proxy type.
1519 using reference = bool&;
1520 using simd_type = simd<_Tp, _Abi>;
1521 using abi_type = _Abi;
1522 static constexpr size_t size() noexcept;
1523 simd_mask() = default;
1524
1525 // broadcast constructor
1526 explicit simd_mask(value_type) noexcept;
1527
1528 // implicit type conversion constructor
1529 template <class _Up>
1530 simd_mask(const simd_mask<_Up, simd_abi::fixed_size<size()>>&) noexcept;
1531
1532 // load constructor
1533 template <class _Flags>
1534 simd_mask(const value_type*, _Flags);
1535
1536 // loads [simd.mask.copy]
1537 template <class _Flags>
1538 void copy_from(const value_type*, _Flags);
1539 template <class _Flags>
1540 void copy_to(value_type*, _Flags) const;
1541
1542 // scalar access [simd.mask.subscr]
1543 reference operator[](size_t);
1544 value_type operator[](size_t) const;
1545
1546 // unary operators [simd.mask.unary]
1547 simd_mask operator!() const noexcept;
1548
1549 // simd_mask binary operators [simd.mask.binary]
1550 friend simd_mask operator&&(const simd_mask&, const simd_mask&) noexcept;
1551 friend simd_mask operator||(const simd_mask&, const simd_mask&) noexcept;
1552 friend simd_mask operator&(const simd_mask&, const simd_mask&)noexcept;
1553 friend simd_mask operator|(const simd_mask&, const simd_mask&) noexcept;
1554 friend simd_mask operator^(const simd_mask&, const simd_mask&) noexcept;
1555
1556 // simd_mask compound assignment [simd.mask.cassign]
1557 friend simd_mask& operator&=(simd_mask&, const simd_mask&) noexcept;
1558 friend simd_mask& operator|=(simd_mask&, const simd_mask&) noexcept;
1559 friend simd_mask& operator^=(simd_mask&, const simd_mask&) noexcept;
1560
1561 // simd_mask compares [simd.mask.comparison]
1562 friend simd_mask operator==(const simd_mask&, const simd_mask&) noexcept;
1563 friend simd_mask operator!=(const simd_mask&, const simd_mask&) noexcept;
1564};
1565
Tim Shend87ea292018-07-30 22:27:38 +00001566#endif // _LIBCPP_STD_VER >= 17
1567
Tim Shen158e51b2018-04-23 21:54:06 +00001568_LIBCPP_END_NAMESPACE_EXPERIMENTAL_SIMD
1569
Arthur O'Dwyer2422fa22020-12-02 18:55:01 -05001570_LIBCPP_POP_MACROS
1571
Tim Shen158e51b2018-04-23 21:54:06 +00001572#endif /* _LIBCPP_EXPERIMENTAL_SIMD */