blob: 240f4f4db5b7626f66bd072dd8723f3703e79099 [file] [log] [blame]
/*
 * Copyright 2015 Google Inc.
 *
 * Use of this source code is governed by a BSD-style license that can be
 * found in the LICENSE file.
 */
7
8#ifndef SkNx_DEFINED
9#define SkNx_DEFINED
10
Mike Kleinc0bd9f92019-04-23 12:05:21 -050011#include "include/core/SkScalar.h"
12#include "include/core/SkTypes.h"
13#include "include/private/SkSafe_math.h"
Hal Canaryc640d0d2018-06-13 09:59:02 -040014
15#include <algorithm>
mtkleinf8f90e42016-03-21 10:04:46 -070016#include <limits>
mtkleinf8f90e42016-03-21 10:04:46 -070017#include <type_traits>
mtklein082e3292015-08-12 11:56:43 -070018
// Every single SkNx method wants to be fully inlined.  (We know better than MSVC.)
20#define AI SK_ALWAYS_INLINE
Mike Klein1e764642016-10-14 17:09:03 -040021
Mike Kleinc33d6142018-12-12 08:47:54 -050022namespace { // NOLINT(google-build-namespaces)
mtkleinf8f90e42016-03-21 10:04:46 -070023
24// The default SkNx<N,T> just proxies down to a pair of SkNx<N/2, T>.
mtkleinc9adb052015-03-30 10:50:27 -070025template <int N, typename T>
mtkleinf8f90e42016-03-21 10:04:46 -070026struct SkNx {
mtkleine4c0bee2016-02-09 10:35:27 -080027 typedef SkNx<N/2, T> Half;
mtkleinf8f90e42016-03-21 10:04:46 -070028
29 Half fLo, fHi;
30
Mike Klein7c78f3a2016-10-19 09:21:11 -040031 AI SkNx() = default;
32 AI SkNx(const Half& lo, const Half& hi) : fLo(lo), fHi(hi) {}
mtkleine4c0bee2016-02-09 10:35:27 -080033
Mike Klein7c78f3a2016-10-19 09:21:11 -040034 AI SkNx(T v) : fLo(v), fHi(v) {}
mtkleinf8f90e42016-03-21 10:04:46 -070035
Mike Klein7c78f3a2016-10-19 09:21:11 -040036 AI SkNx(T a, T b) : fLo(a) , fHi(b) { static_assert(N==2, ""); }
37 AI SkNx(T a, T b, T c, T d) : fLo(a,b), fHi(c,d) { static_assert(N==4, ""); }
38 AI SkNx(T a, T b, T c, T d, T e, T f, T g, T h) : fLo(a,b,c,d), fHi(e,f,g,h) {
mtkleinf8f90e42016-03-21 10:04:46 -070039 static_assert(N==8, "");
40 }
Mike Klein7c78f3a2016-10-19 09:21:11 -040041 AI SkNx(T a, T b, T c, T d, T e, T f, T g, T h,
42 T i, T j, T k, T l, T m, T n, T o, T p)
43 : fLo(a,b,c,d, e,f,g,h), fHi(i,j,k,l, m,n,o,p) {
mtkleinf8f90e42016-03-21 10:04:46 -070044 static_assert(N==16, "");
mtklein6f37b4a2015-12-14 11:25:18 -080045 }
46
Mike Klein7c78f3a2016-10-19 09:21:11 -040047 AI T operator[](int k) const {
mtklein115acee2015-04-14 14:02:52 -070048 SkASSERT(0 <= k && k < N);
mtkleine4c0bee2016-02-09 10:35:27 -080049 return k < N/2 ? fLo[k] : fHi[k-N/2];
mtklein115acee2015-04-14 14:02:52 -070050 }
51
Mike Klein7c78f3a2016-10-19 09:21:11 -040052 AI static SkNx Load(const void* vptr) {
mtkleinf8f90e42016-03-21 10:04:46 -070053 auto ptr = (const char*)vptr;
54 return { Half::Load(ptr), Half::Load(ptr + N/2*sizeof(T)) };
55 }
Mike Klein7c78f3a2016-10-19 09:21:11 -040056 AI void store(void* vptr) const {
mtkleinf8f90e42016-03-21 10:04:46 -070057 auto ptr = (char*)vptr;
58 fLo.store(ptr);
59 fHi.store(ptr + N/2*sizeof(T));
mtkleinb5e86112015-06-24 15:18:39 -070060 }
61
Mike Klein7c78f3a2016-10-19 09:21:11 -040062 AI static void Load4(const void* vptr, SkNx* a, SkNx* b, SkNx* c, SkNx* d) {
Mike Klein33cbfd72016-10-06 11:09:27 -040063 auto ptr = (const char*)vptr;
64 Half al, bl, cl, dl,
65 ah, bh, ch, dh;
66 Half::Load4(ptr , &al, &bl, &cl, &dl);
67 Half::Load4(ptr + 4*N/2*sizeof(T), &ah, &bh, &ch, &dh);
68 *a = SkNx{al, ah};
69 *b = SkNx{bl, bh};
70 *c = SkNx{cl, ch};
71 *d = SkNx{dl, dh};
72 }
Matt Sarett5bee0b62017-01-19 12:04:32 -050073 AI static void Load3(const void* vptr, SkNx* a, SkNx* b, SkNx* c) {
74 auto ptr = (const char*)vptr;
75 Half al, bl, cl,
76 ah, bh, ch;
77 Half::Load3(ptr , &al, &bl, &cl);
78 Half::Load3(ptr + 3*N/2*sizeof(T), &ah, &bh, &ch);
79 *a = SkNx{al, ah};
80 *b = SkNx{bl, bh};
81 *c = SkNx{cl, ch};
82 }
Mike Klein213d8212017-11-30 12:07:20 -050083 AI static void Load2(const void* vptr, SkNx* a, SkNx* b) {
84 auto ptr = (const char*)vptr;
85 Half al, bl,
86 ah, bh;
87 Half::Load2(ptr , &al, &bl);
88 Half::Load2(ptr + 2*N/2*sizeof(T), &ah, &bh);
89 *a = SkNx{al, ah};
90 *b = SkNx{bl, bh};
91 }
Mike Klein7c78f3a2016-10-19 09:21:11 -040092 AI static void Store4(void* vptr, const SkNx& a, const SkNx& b, const SkNx& c, const SkNx& d) {
Mike Klein33cbfd72016-10-06 11:09:27 -040093 auto ptr = (char*)vptr;
94 Half::Store4(ptr, a.fLo, b.fLo, c.fLo, d.fLo);
95 Half::Store4(ptr + 4*N/2*sizeof(T), a.fHi, b.fHi, c.fHi, d.fHi);
96 }
Chris Dalton0cb75872017-12-01 13:23:05 -070097 AI static void Store3(void* vptr, const SkNx& a, const SkNx& b, const SkNx& c) {
98 auto ptr = (char*)vptr;
99 Half::Store3(ptr, a.fLo, b.fLo, c.fLo);
100 Half::Store3(ptr + 3*N/2*sizeof(T), a.fHi, b.fHi, c.fHi);
101 }
Chris Dalton42f02aa2018-04-08 23:58:43 -0600102 AI static void Store2(void* vptr, const SkNx& a, const SkNx& b) {
103 auto ptr = (char*)vptr;
104 Half::Store2(ptr, a.fLo, b.fLo);
105 Half::Store2(ptr + 2*N/2*sizeof(T), a.fHi, b.fHi);
106 }
Mike Klein33cbfd72016-10-06 11:09:27 -0400107
Mike Kleinbf45c702018-06-11 11:56:57 -0400108 AI T min() const { return SkTMin(fLo.min(), fHi.min()); }
109 AI T max() const { return SkTMax(fLo.max(), fHi.max()); }
Mike Klein7c78f3a2016-10-19 09:21:11 -0400110 AI bool anyTrue() const { return fLo.anyTrue() || fHi.anyTrue(); }
111 AI bool allTrue() const { return fLo.allTrue() && fHi.allTrue(); }
mtklein115acee2015-04-14 14:02:52 -0700112
Mike Klein7c78f3a2016-10-19 09:21:11 -0400113 AI SkNx abs() const { return { fLo. abs(), fHi. abs() }; }
114 AI SkNx sqrt() const { return { fLo. sqrt(), fHi. sqrt() }; }
115 AI SkNx rsqrt() const { return { fLo. rsqrt(), fHi. rsqrt() }; }
116 AI SkNx floor() const { return { fLo. floor(), fHi. floor() }; }
117 AI SkNx invert() const { return { fLo.invert(), fHi.invert() }; }
mtkleinf8f90e42016-03-21 10:04:46 -0700118
Mike Klein7c78f3a2016-10-19 09:21:11 -0400119 AI SkNx operator!() const { return { !fLo, !fHi }; }
120 AI SkNx operator-() const { return { -fLo, -fHi }; }
121 AI SkNx operator~() const { return { ~fLo, ~fHi }; }
mtkleinf8f90e42016-03-21 10:04:46 -0700122
Mike Klein7c78f3a2016-10-19 09:21:11 -0400123 AI SkNx operator<<(int bits) const { return { fLo << bits, fHi << bits }; }
124 AI SkNx operator>>(int bits) const { return { fLo >> bits, fHi >> bits }; }
mtkleinf8f90e42016-03-21 10:04:46 -0700125
Mike Klein7c78f3a2016-10-19 09:21:11 -0400126 AI SkNx operator+(const SkNx& y) const { return { fLo + y.fLo, fHi + y.fHi }; }
127 AI SkNx operator-(const SkNx& y) const { return { fLo - y.fLo, fHi - y.fHi }; }
128 AI SkNx operator*(const SkNx& y) const { return { fLo * y.fLo, fHi * y.fHi }; }
129 AI SkNx operator/(const SkNx& y) const { return { fLo / y.fLo, fHi / y.fHi }; }
mtkleinf8f90e42016-03-21 10:04:46 -0700130
Mike Klein7c78f3a2016-10-19 09:21:11 -0400131 AI SkNx operator&(const SkNx& y) const { return { fLo & y.fLo, fHi & y.fHi }; }
132 AI SkNx operator|(const SkNx& y) const { return { fLo | y.fLo, fHi | y.fHi }; }
133 AI SkNx operator^(const SkNx& y) const { return { fLo ^ y.fLo, fHi ^ y.fHi }; }
mtkleinf8f90e42016-03-21 10:04:46 -0700134
Mike Klein7c78f3a2016-10-19 09:21:11 -0400135 AI SkNx operator==(const SkNx& y) const { return { fLo == y.fLo, fHi == y.fHi }; }
136 AI SkNx operator!=(const SkNx& y) const { return { fLo != y.fLo, fHi != y.fHi }; }
137 AI SkNx operator<=(const SkNx& y) const { return { fLo <= y.fLo, fHi <= y.fHi }; }
138 AI SkNx operator>=(const SkNx& y) const { return { fLo >= y.fLo, fHi >= y.fHi }; }
139 AI SkNx operator< (const SkNx& y) const { return { fLo < y.fLo, fHi < y.fHi }; }
140 AI SkNx operator> (const SkNx& y) const { return { fLo > y.fLo, fHi > y.fHi }; }
mtkleinf8f90e42016-03-21 10:04:46 -0700141
Mike Klein7c78f3a2016-10-19 09:21:11 -0400142 AI SkNx saturatedAdd(const SkNx& y) const {
mtkleinf8f90e42016-03-21 10:04:46 -0700143 return { fLo.saturatedAdd(y.fLo), fHi.saturatedAdd(y.fHi) };
144 }
Herb Derby5eb15282017-10-10 17:14:18 -0400145
146 AI SkNx mulHi(const SkNx& m) const {
147 return { fLo.mulHi(m.fLo), fHi.mulHi(m.fHi) };
148 }
Mike Klein7c78f3a2016-10-19 09:21:11 -0400149 AI SkNx thenElse(const SkNx& t, const SkNx& e) const {
mtkleinf8f90e42016-03-21 10:04:46 -0700150 return { fLo.thenElse(t.fLo, e.fLo), fHi.thenElse(t.fHi, e.fHi) };
151 }
Mike Klein7c78f3a2016-10-19 09:21:11 -0400152 AI static SkNx Min(const SkNx& x, const SkNx& y) {
mtkleinf8f90e42016-03-21 10:04:46 -0700153 return { Half::Min(x.fLo, y.fLo), Half::Min(x.fHi, y.fHi) };
154 }
Mike Klein7c78f3a2016-10-19 09:21:11 -0400155 AI static SkNx Max(const SkNx& x, const SkNx& y) {
mtkleinf8f90e42016-03-21 10:04:46 -0700156 return { Half::Max(x.fLo, y.fLo), Half::Max(x.fHi, y.fHi) };
157 }
mtklein115acee2015-04-14 14:02:52 -0700158};
159
mtkleinf8f90e42016-03-21 10:04:46 -0700160// The N -> N/2 recursion bottoms out at N == 1, a scalar value.
mtkleinc9adb052015-03-30 10:50:27 -0700161template <typename T>
mtkleinf8f90e42016-03-21 10:04:46 -0700162struct SkNx<1,T> {
163 T fVal;
mtkleine4c0bee2016-02-09 10:35:27 -0800164
Mike Klein7c78f3a2016-10-19 09:21:11 -0400165 AI SkNx() = default;
166 AI SkNx(T v) : fVal(v) {}
mtkleinc9adb052015-03-30 10:50:27 -0700167
reed12644722016-07-12 09:12:30 -0700168 // Android complains against unused parameters, so we guard it
Mike Klein7c78f3a2016-10-19 09:21:11 -0400169 AI T operator[](int SkDEBUGCODE(k)) const {
mtkleinf8f90e42016-03-21 10:04:46 -0700170 SkASSERT(k == 0);
mtkleinc9adb052015-03-30 10:50:27 -0700171 return fVal;
172 }
173
Mike Klein7c78f3a2016-10-19 09:21:11 -0400174 AI static SkNx Load(const void* ptr) {
mtkleinf8f90e42016-03-21 10:04:46 -0700175 SkNx v;
176 memcpy(&v, ptr, sizeof(T));
177 return v;
178 }
Mike Klein7c78f3a2016-10-19 09:21:11 -0400179 AI void store(void* ptr) const { memcpy(ptr, &fVal, sizeof(T)); }
mtkleinf8f90e42016-03-21 10:04:46 -0700180
Mike Klein7c78f3a2016-10-19 09:21:11 -0400181 AI static void Load4(const void* vptr, SkNx* a, SkNx* b, SkNx* c, SkNx* d) {
Mike Klein33cbfd72016-10-06 11:09:27 -0400182 auto ptr = (const char*)vptr;
183 *a = Load(ptr + 0*sizeof(T));
184 *b = Load(ptr + 1*sizeof(T));
185 *c = Load(ptr + 2*sizeof(T));
186 *d = Load(ptr + 3*sizeof(T));
187 }
Matt Sarett5bee0b62017-01-19 12:04:32 -0500188 AI static void Load3(const void* vptr, SkNx* a, SkNx* b, SkNx* c) {
189 auto ptr = (const char*)vptr;
190 *a = Load(ptr + 0*sizeof(T));
191 *b = Load(ptr + 1*sizeof(T));
192 *c = Load(ptr + 2*sizeof(T));
193 }
Mike Klein213d8212017-11-30 12:07:20 -0500194 AI static void Load2(const void* vptr, SkNx* a, SkNx* b) {
195 auto ptr = (const char*)vptr;
196 *a = Load(ptr + 0*sizeof(T));
197 *b = Load(ptr + 1*sizeof(T));
198 }
Mike Klein7c78f3a2016-10-19 09:21:11 -0400199 AI static void Store4(void* vptr, const SkNx& a, const SkNx& b, const SkNx& c, const SkNx& d) {
Mike Klein33cbfd72016-10-06 11:09:27 -0400200 auto ptr = (char*)vptr;
201 a.store(ptr + 0*sizeof(T));
202 b.store(ptr + 1*sizeof(T));
203 c.store(ptr + 2*sizeof(T));
204 d.store(ptr + 3*sizeof(T));
205 }
Chris Dalton0cb75872017-12-01 13:23:05 -0700206 AI static void Store3(void* vptr, const SkNx& a, const SkNx& b, const SkNx& c) {
207 auto ptr = (char*)vptr;
208 a.store(ptr + 0*sizeof(T));
209 b.store(ptr + 1*sizeof(T));
210 c.store(ptr + 2*sizeof(T));
211 }
Chris Dalton42f02aa2018-04-08 23:58:43 -0600212 AI static void Store2(void* vptr, const SkNx& a, const SkNx& b) {
213 auto ptr = (char*)vptr;
214 a.store(ptr + 0*sizeof(T));
215 b.store(ptr + 1*sizeof(T));
216 }
Mike Klein33cbfd72016-10-06 11:09:27 -0400217
Chris Daltone3fda932018-04-11 13:18:09 -0600218 AI T min() const { return fVal; }
219 AI T max() const { return fVal; }
Mike Klein7c78f3a2016-10-19 09:21:11 -0400220 AI bool anyTrue() const { return fVal != 0; }
221 AI bool allTrue() const { return fVal != 0; }
mtkleinf8f90e42016-03-21 10:04:46 -0700222
Mike Klein7c78f3a2016-10-19 09:21:11 -0400223 AI SkNx abs() const { return Abs(fVal); }
224 AI SkNx sqrt() const { return Sqrt(fVal); }
225 AI SkNx rsqrt() const { return T(1) / this->sqrt(); }
226 AI SkNx floor() const { return Floor(fVal); }
227 AI SkNx invert() const { return T(1) / *this; }
mtkleinf8f90e42016-03-21 10:04:46 -0700228
Mike Klein7c78f3a2016-10-19 09:21:11 -0400229 AI SkNx operator!() const { return !fVal; }
230 AI SkNx operator-() const { return -fVal; }
231 AI SkNx operator~() const { return FromBits(~ToBits(fVal)); }
mtkleinf8f90e42016-03-21 10:04:46 -0700232
Mike Klein7c78f3a2016-10-19 09:21:11 -0400233 AI SkNx operator<<(int bits) const { return fVal << bits; }
234 AI SkNx operator>>(int bits) const { return fVal >> bits; }
mtkleinf8f90e42016-03-21 10:04:46 -0700235
Mike Klein7c78f3a2016-10-19 09:21:11 -0400236 AI SkNx operator+(const SkNx& y) const { return fVal + y.fVal; }
237 AI SkNx operator-(const SkNx& y) const { return fVal - y.fVal; }
238 AI SkNx operator*(const SkNx& y) const { return fVal * y.fVal; }
239 AI SkNx operator/(const SkNx& y) const { return fVal / y.fVal; }
mtkleinf8f90e42016-03-21 10:04:46 -0700240
Mike Klein7c78f3a2016-10-19 09:21:11 -0400241 AI SkNx operator&(const SkNx& y) const { return FromBits(ToBits(fVal) & ToBits(y.fVal)); }
242 AI SkNx operator|(const SkNx& y) const { return FromBits(ToBits(fVal) | ToBits(y.fVal)); }
243 AI SkNx operator^(const SkNx& y) const { return FromBits(ToBits(fVal) ^ ToBits(y.fVal)); }
mtkleinf8f90e42016-03-21 10:04:46 -0700244
Mike Klein7c78f3a2016-10-19 09:21:11 -0400245 AI SkNx operator==(const SkNx& y) const { return FromBits(fVal == y.fVal ? ~0 : 0); }
246 AI SkNx operator!=(const SkNx& y) const { return FromBits(fVal != y.fVal ? ~0 : 0); }
247 AI SkNx operator<=(const SkNx& y) const { return FromBits(fVal <= y.fVal ? ~0 : 0); }
248 AI SkNx operator>=(const SkNx& y) const { return FromBits(fVal >= y.fVal ? ~0 : 0); }
249 AI SkNx operator< (const SkNx& y) const { return FromBits(fVal < y.fVal ? ~0 : 0); }
250 AI SkNx operator> (const SkNx& y) const { return FromBits(fVal > y.fVal ? ~0 : 0); }
mtkleinf8f90e42016-03-21 10:04:46 -0700251
Mike Klein7c78f3a2016-10-19 09:21:11 -0400252 AI static SkNx Min(const SkNx& x, const SkNx& y) { return x.fVal < y.fVal ? x : y; }
253 AI static SkNx Max(const SkNx& x, const SkNx& y) { return x.fVal > y.fVal ? x : y; }
mtkleinf8f90e42016-03-21 10:04:46 -0700254
Mike Klein7c78f3a2016-10-19 09:21:11 -0400255 AI SkNx saturatedAdd(const SkNx& y) const {
mtkleinf8f90e42016-03-21 10:04:46 -0700256 static_assert(std::is_unsigned<T>::value, "");
257 T sum = fVal + y.fVal;
258 return sum < fVal ? std::numeric_limits<T>::max() : sum;
259 }
260
Herb Derby5eb15282017-10-10 17:14:18 -0400261 AI SkNx mulHi(const SkNx& m) const {
262 static_assert(std::is_unsigned<T>::value, "");
263 static_assert(sizeof(T) <= 4, "");
264 return static_cast<T>((static_cast<uint64_t>(fVal) * m.fVal) >> (sizeof(T)*8));
265 }
266
Mike Klein7c78f3a2016-10-19 09:21:11 -0400267 AI SkNx thenElse(const SkNx& t, const SkNx& e) const { return fVal != 0 ? t : e; }
mtkleinb5e86112015-06-24 15:18:39 -0700268
mtkleinf8f90e42016-03-21 10:04:46 -0700269private:
270 // Helper functions to choose the right float/double methods. (In <cmath> madness lies...)
Yuqian Li7da6ba22017-07-12 13:36:05 -0400271 AI static int Abs(int val) { return val < 0 ? -val : val; }
272
Mike Klein7c78f3a2016-10-19 09:21:11 -0400273 AI static float Abs(float val) { return ::fabsf(val); }
274 AI static float Sqrt(float val) { return ::sqrtf(val); }
275 AI static float Floor(float val) { return ::floorf(val); }
mtkleinb5e86112015-06-24 15:18:39 -0700276
Mike Klein7c78f3a2016-10-19 09:21:11 -0400277 AI static double Abs(double val) { return ::fabs(val); }
278 AI static double Sqrt(double val) { return ::sqrt(val); }
279 AI static double Floor(double val) { return ::floor(val); }
mtkleinf8f90e42016-03-21 10:04:46 -0700280
281 // Helper functions for working with floats/doubles as bit patterns.
Mike Klein7c78f3a2016-10-19 09:21:11 -0400282 template <typename U>
283 AI static U ToBits(U v) { return v; }
284 AI static int32_t ToBits(float v) { int32_t bits; memcpy(&bits, &v, sizeof(v)); return bits; }
285 AI static int64_t ToBits(double v) { int64_t bits; memcpy(&bits, &v, sizeof(v)); return bits; }
mtkleinf8f90e42016-03-21 10:04:46 -0700286
Mike Klein7c78f3a2016-10-19 09:21:11 -0400287 template <typename Bits>
288 AI static T FromBits(Bits bits) {
mtkleinf8f90e42016-03-21 10:04:46 -0700289 static_assert(std::is_pod<T >::value &&
290 std::is_pod<Bits>::value &&
291 sizeof(T) <= sizeof(Bits), "");
292 T val;
293 memcpy(&val, &bits, sizeof(T));
294 return val;
295 }
mtkleinc9adb052015-03-30 10:50:27 -0700296};
297
mtkleinf8f90e42016-03-21 10:04:46 -0700298// Allow scalars on the left or right of binary operators, and things like +=, &=, etc.
Mike Klein7c78f3a2016-10-19 09:21:11 -0400299#define V template <int N, typename T> AI static SkNx<N,T>
mtkleinf8f90e42016-03-21 10:04:46 -0700300 V operator+ (T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) + y; }
301 V operator- (T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) - y; }
302 V operator* (T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) * y; }
303 V operator/ (T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) / y; }
304 V operator& (T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) & y; }
305 V operator| (T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) | y; }
306 V operator^ (T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) ^ y; }
307 V operator==(T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) == y; }
308 V operator!=(T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) != y; }
309 V operator<=(T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) <= y; }
310 V operator>=(T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) >= y; }
311 V operator< (T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) < y; }
312 V operator> (T x, const SkNx<N,T>& y) { return SkNx<N,T>(x) > y; }
313
314 V operator+ (const SkNx<N,T>& x, T y) { return x + SkNx<N,T>(y); }
315 V operator- (const SkNx<N,T>& x, T y) { return x - SkNx<N,T>(y); }
316 V operator* (const SkNx<N,T>& x, T y) { return x * SkNx<N,T>(y); }
317 V operator/ (const SkNx<N,T>& x, T y) { return x / SkNx<N,T>(y); }
318 V operator& (const SkNx<N,T>& x, T y) { return x & SkNx<N,T>(y); }
319 V operator| (const SkNx<N,T>& x, T y) { return x | SkNx<N,T>(y); }
320 V operator^ (const SkNx<N,T>& x, T y) { return x ^ SkNx<N,T>(y); }
321 V operator==(const SkNx<N,T>& x, T y) { return x == SkNx<N,T>(y); }
322 V operator!=(const SkNx<N,T>& x, T y) { return x != SkNx<N,T>(y); }
323 V operator<=(const SkNx<N,T>& x, T y) { return x <= SkNx<N,T>(y); }
324 V operator>=(const SkNx<N,T>& x, T y) { return x >= SkNx<N,T>(y); }
325 V operator< (const SkNx<N,T>& x, T y) { return x < SkNx<N,T>(y); }
326 V operator> (const SkNx<N,T>& x, T y) { return x > SkNx<N,T>(y); }
327
328 V& operator<<=(SkNx<N,T>& x, int bits) { return (x = x << bits); }
329 V& operator>>=(SkNx<N,T>& x, int bits) { return (x = x >> bits); }
330
331 V& operator +=(SkNx<N,T>& x, const SkNx<N,T>& y) { return (x = x + y); }
332 V& operator -=(SkNx<N,T>& x, const SkNx<N,T>& y) { return (x = x - y); }
333 V& operator *=(SkNx<N,T>& x, const SkNx<N,T>& y) { return (x = x * y); }
334 V& operator /=(SkNx<N,T>& x, const SkNx<N,T>& y) { return (x = x / y); }
335 V& operator &=(SkNx<N,T>& x, const SkNx<N,T>& y) { return (x = x & y); }
336 V& operator |=(SkNx<N,T>& x, const SkNx<N,T>& y) { return (x = x | y); }
337 V& operator ^=(SkNx<N,T>& x, const SkNx<N,T>& y) { return (x = x ^ y); }
338
339 V& operator +=(SkNx<N,T>& x, T y) { return (x = x + SkNx<N,T>(y)); }
340 V& operator -=(SkNx<N,T>& x, T y) { return (x = x - SkNx<N,T>(y)); }
341 V& operator *=(SkNx<N,T>& x, T y) { return (x = x * SkNx<N,T>(y)); }
342 V& operator /=(SkNx<N,T>& x, T y) { return (x = x / SkNx<N,T>(y)); }
343 V& operator &=(SkNx<N,T>& x, T y) { return (x = x & SkNx<N,T>(y)); }
344 V& operator |=(SkNx<N,T>& x, T y) { return (x = x | SkNx<N,T>(y)); }
345 V& operator ^=(SkNx<N,T>& x, T y) { return (x = x ^ SkNx<N,T>(y)); }
346#undef V
347
348// SkNx<N,T> ~~> SkNx<N/2,T> + SkNx<N/2,T>
349template <int N, typename T>
Mike Klein7c78f3a2016-10-19 09:21:11 -0400350AI static void SkNx_split(const SkNx<N,T>& v, SkNx<N/2,T>* lo, SkNx<N/2,T>* hi) {
mtkleinf8f90e42016-03-21 10:04:46 -0700351 *lo = v.fLo;
352 *hi = v.fHi;
353}
354
355// SkNx<N/2,T> + SkNx<N/2,T> ~~> SkNx<N,T>
356template <int N, typename T>
Mike Klein7c78f3a2016-10-19 09:21:11 -0400357AI static SkNx<N*2,T> SkNx_join(const SkNx<N,T>& lo, const SkNx<N,T>& hi) {
mtkleinf8f90e42016-03-21 10:04:46 -0700358 return { lo, hi };
359}
360
361// A very generic shuffle. Can reorder, duplicate, contract, expand...
362// Sk4f v = { R,G,B,A };
363// SkNx_shuffle<2,1,0,3>(v) ~~> {B,G,R,A}
364// SkNx_shuffle<2,1>(v) ~~> {B,G}
365// SkNx_shuffle<2,1,2,1,2,1,2,1>(v) ~~> {B,G,B,G,B,G,B,G}
366// SkNx_shuffle<3,3,3,3>(v) ~~> {A,A,A,A}
mtkleine4c0bee2016-02-09 10:35:27 -0800367template <int... Ix, int N, typename T>
Mike Klein7c78f3a2016-10-19 09:21:11 -0400368AI static SkNx<sizeof...(Ix),T> SkNx_shuffle(const SkNx<N,T>& v) {
mtkleinf8f90e42016-03-21 10:04:46 -0700369 return { v[Ix]... };
mtklein6c221b42015-11-20 13:53:19 -0800370}
mtkleina1c0ee42015-09-10 14:16:07 -0700371
mtkleinf8f90e42016-03-21 10:04:46 -0700372// Cast from SkNx<N, Src> to SkNx<N, Dst>, as if you called static_cast<Dst>(Src).
373template <typename Dst, typename Src, int N>
Mike Klein7c78f3a2016-10-19 09:21:11 -0400374AI static SkNx<N,Dst> SkNx_cast(const SkNx<N,Src>& v) {
mtkleinf8f90e42016-03-21 10:04:46 -0700375 return { SkNx_cast<Dst>(v.fLo), SkNx_cast<Dst>(v.fHi) };
mtkleine4c0bee2016-02-09 10:35:27 -0800376}
mtkleinf8f90e42016-03-21 10:04:46 -0700377template <typename Dst, typename Src>
Mike Klein7c78f3a2016-10-19 09:21:11 -0400378AI static SkNx<1,Dst> SkNx_cast(const SkNx<1,Src>& v) {
mtkleinf8f90e42016-03-21 10:04:46 -0700379 return static_cast<Dst>(v.fVal);
mtkleine4c0bee2016-02-09 10:35:27 -0800380}
mtkleinfce612a2015-12-15 07:38:54 -0800381
Mike Klein04adfda2016-10-12 09:52:55 -0400382template <int N, typename T>
Mike Klein7c78f3a2016-10-19 09:21:11 -0400383AI static SkNx<N,T> SkNx_fma(const SkNx<N,T>& f, const SkNx<N,T>& m, const SkNx<N,T>& a) {
Mike Klein04adfda2016-10-12 09:52:55 -0400384 return f*m+a;
385}
386
Mike Klein1e764642016-10-14 17:09:03 -0400387} // namespace
388
mtkleine4c0bee2016-02-09 10:35:27 -0800389typedef SkNx<2, float> Sk2f;
390typedef SkNx<4, float> Sk4f;
mtkleinf8f90e42016-03-21 10:04:46 -0700391typedef SkNx<8, float> Sk8f;
392typedef SkNx<16, float> Sk16f;
393
mtkleine4c0bee2016-02-09 10:35:27 -0800394typedef SkNx<2, SkScalar> Sk2s;
395typedef SkNx<4, SkScalar> Sk4s;
mtkleinf8f90e42016-03-21 10:04:46 -0700396typedef SkNx<8, SkScalar> Sk8s;
397typedef SkNx<16, SkScalar> Sk16s;
mtkleinc9adb052015-03-30 10:50:27 -0700398
mtkleine4c0bee2016-02-09 10:35:27 -0800399typedef SkNx<4, uint8_t> Sk4b;
mtkleinf8f90e42016-03-21 10:04:46 -0700400typedef SkNx<8, uint8_t> Sk8b;
mtkleine4c0bee2016-02-09 10:35:27 -0800401typedef SkNx<16, uint8_t> Sk16b;
mtklein6f37b4a2015-12-14 11:25:18 -0800402
mtkleinf8f90e42016-03-21 10:04:46 -0700403typedef SkNx<4, uint16_t> Sk4h;
404typedef SkNx<8, uint16_t> Sk8h;
405typedef SkNx<16, uint16_t> Sk16h;
406
mtkleind05a8752016-07-29 10:10:15 -0700407typedef SkNx<4, int32_t> Sk4i;
Mike Klein04adfda2016-10-12 09:52:55 -0400408typedef SkNx<8, int32_t> Sk8i;
mtkleind05a8752016-07-29 10:10:15 -0700409typedef SkNx<4, uint32_t> Sk4u;
mtkleinff9febf2016-02-16 14:33:08 -0800410
// Include platform-specific specializations if available.
mtklein81bb79b2016-02-08 15:50:22 -0800412#if !defined(SKNX_NO_SIMD) && SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE2
Mike Kleinc0bd9f92019-04-23 12:05:21 -0500413 #include "include/private/SkNx_sse.h"
mtklein6f37b4a2015-12-14 11:25:18 -0800414#elif !defined(SKNX_NO_SIMD) && defined(SK_ARM_HAS_NEON)
Mike Kleinc0bd9f92019-04-23 12:05:21 -0500415 #include "include/private/SkNx_neon.h"
msarett7d3ff712016-07-12 14:55:45 -0700416#else
417
Mike Klein7c78f3a2016-10-19 09:21:11 -0400418AI static Sk4i Sk4f_round(const Sk4f& x) {
msarett7d3ff712016-07-12 14:55:45 -0700419 return { (int) lrintf (x[0]),
420 (int) lrintf (x[1]),
421 (int) lrintf (x[2]),
422 (int) lrintf (x[3]), };
423}
424
mtklein6f37b4a2015-12-14 11:25:18 -0800425#endif
426
Mike Klein7c78f3a2016-10-19 09:21:11 -0400427AI static void Sk4f_ToBytes(uint8_t p[16],
428 const Sk4f& a, const Sk4f& b, const Sk4f& c, const Sk4f& d) {
mtkleinf8f90e42016-03-21 10:04:46 -0700429 SkNx_cast<uint8_t>(SkNx_join(SkNx_join(a,b), SkNx_join(c,d))).store(p);
430}
431
Mike Klein7c78f3a2016-10-19 09:21:11 -0400432#undef AI
mtkleinf8f90e42016-03-21 10:04:46 -0700433
mtklein3e490b72015-03-20 06:33:02 -0700434#endif//SkNx_DEFINED