| OLD | NEW |
| 1 /* | 1 /* |
| 2 * Copyright 2015 Google Inc. | 2 * Copyright 2015 Google Inc. |
| 3 * | 3 * |
| 4 * Use of this source code is governed by a BSD-style license that can be | 4 * Use of this source code is governed by a BSD-style license that can be |
| 5 * found in the LICENSE file. | 5 * found in the LICENSE file. |
| 6 */ | 6 */ |
| 7 | 7 |
| 8 #ifndef SkNx_DEFINED | 8 #ifndef SkNx_DEFINED |
| 9 #define SkNx_DEFINED | 9 #define SkNx_DEFINED |
| 10 | 10 |
| 11 | 11 |
| 12 #define SKNX_NO_SIMDx // Remove the x to disable SIMD for all SkNx types. | 12 #define SKNX_NO_SIMDx // Remove the x to disable SIMD for all SkNx types. |
| 13 | 13 |
| 14 | 14 |
| 15 #include "SkScalar.h" | 15 #include "SkScalar.h" |
| 16 #include "SkTypes.h" | 16 #include "SkTypes.h" |
| 17 #include <math.h> | 17 #include <math.h> |
| 18 #define REQUIRE(x) static_assert(x, #x) | 18 #define REQUIRE(x) static_assert(x, #x) |
| 19 | 19 |
| 20 // This file may be included multiple times by .cpp files with different flags,
leading | 20 // This file may be included multiple times by .cpp files with different flags,
leading |
| 21 // to different definitions. Usually that doesn't matter because it's all inlin
ed, but | 21 // to different definitions. Usually that doesn't matter because it's all inlin
ed, but |
| 22 // in Debug modes the compilers may not inline everything. So wrap everything i
n an | 22 // in Debug modes the compilers may not inline everything. So wrap everything i
n an |
| 23 // anonymous namespace to give each includer their own silo of this code (or the
linker | 23 // anonymous namespace to give each includer their own silo of this code (or the
linker |
| 24 // will probably pick one randomly for us, which is rarely correct). | 24 // will probably pick one randomly for us, which is rarely correct). |
| 25 namespace { | 25 namespace { |
| 26 | 26 |
| 27 // The default implementations just fall back on a pair of size N/2. | 27 // The default implementations just fall back on a pair of size N/2. |
| 28 | 28 |
| 29 template <int N, typename T> | 29 template <int N, typename T> |
| 30 class SkNi { | 30 class SkNx { |
| 31 public: | 31 public: |
| 32 SkNi() {} | 32 SkNx() {} |
| 33 SkNi(const SkNi<N/2, T>& lo, const SkNi<N/2, T>& hi) : fLo(lo), fHi(hi) {} | 33 SkNx(const SkNx<N/2, T>& lo, const SkNx<N/2, T>& hi) : fLo(lo), fHi(hi) {} |
| 34 SkNi(T val) : fLo(val), fHi(val) {} | 34 SkNx(T val) : fLo(val), fHi(val) {} |
| 35 static SkNi Load(const T vals[N]) { | 35 static SkNx Load(const T vals[N]) { |
| 36 return SkNi(SkNi<N/2,T>::Load(vals), SkNi<N/2,T>::Load(vals+N/2)); | 36 return SkNx(SkNx<N/2,T>::Load(vals), SkNx<N/2,T>::Load(vals+N/2)); |
| 37 } | 37 } |
| 38 | 38 |
| 39 SkNi(T a, T b) : fLo(a), fHi(b) {
REQUIRE(N==2); } | 39 SkNx(T a, T b) : fLo(a), fHi(b) {
REQUIRE(N==2); } |
| 40 SkNi(T a, T b, T c, T d) : fLo(a,b), fHi(c,d) {
REQUIRE(N==4); } | 40 SkNx(T a, T b, T c, T d) : fLo(a,b), fHi(c,d) {
REQUIRE(N==4); } |
| 41 SkNi(T a, T b, T c, T d, T e, T f, T g, T h) : fLo(a,b,c,d), fHi(e,f,g,h) {
REQUIRE(N==8); } | 41 SkNx(T a, T b, T c, T d, T e, T f, T g, T h) : fLo(a,b,c,d), fHi(e,f,g,h) {
REQUIRE(N==8); } |
| 42 SkNi(T a, T b, T c, T d, T e, T f, T g, T h, | 42 SkNx(T a, T b, T c, T d, T e, T f, T g, T h, |
| 43 T i, T j, T k, T l, T m, T n, T o, T p) | 43 T i, T j, T k, T l, T m, T n, T o, T p) |
| 44 : fLo(a,b,c,d, e,f,g,h), fHi(i,j,k,l, m,n,o,p) { REQUIRE(N==16); } | 44 : fLo(a,b,c,d, e,f,g,h), fHi(i,j,k,l, m,n,o,p) { REQUIRE(N==16); } |
| 45 | 45 |
| 46 void store(T vals[N]) const { | 46 void store(T vals[N]) const { |
| 47 fLo.store(vals); | 47 fLo.store(vals); |
| 48 fHi.store(vals+N/2); | 48 fHi.store(vals+N/2); |
| 49 } | 49 } |
| 50 | 50 |
| 51 SkNi saturatedAdd(const SkNi& o) const { | 51 SkNx saturatedAdd(const SkNx& o) const { |
| 52 return SkNi(fLo.saturatedAdd(o.fLo), fHi.saturatedAdd(o.fHi)); | 52 return SkNx(fLo.saturatedAdd(o.fLo), fHi.saturatedAdd(o.fHi)); |
| 53 } | 53 } |
| 54 | 54 |
| 55 SkNi operator + (const SkNi& o) const { return SkNi(fLo + o.fLo, fHi + o.fHi
); } | 55 SkNx operator + (const SkNx& o) const { return SkNx(fLo + o.fLo, fHi + o.fHi
); } |
| 56 SkNi operator - (const SkNi& o) const { return SkNi(fLo - o.fLo, fHi - o.fHi
); } | 56 SkNx operator - (const SkNx& o) const { return SkNx(fLo - o.fLo, fHi - o.fHi
); } |
| 57 SkNi operator * (const SkNi& o) const { return SkNi(fLo * o.fLo, fHi * o.fHi
); } | 57 SkNx operator * (const SkNx& o) const { return SkNx(fLo * o.fLo, fHi * o.fHi
); } |
| 58 | 58 |
| 59 SkNi operator << (int bits) const { return SkNi(fLo << bits, fHi << bits); } | 59 SkNx operator << (int bits) const { return SkNx(fLo << bits, fHi << bits); } |
| 60 SkNi operator >> (int bits) const { return SkNi(fLo >> bits, fHi >> bits); } | 60 SkNx operator >> (int bits) const { return SkNx(fLo >> bits, fHi >> bits); } |
| 61 | 61 |
| 62 static SkNi Min(const SkNi& a, const SkNi& b) { | 62 static SkNx Min(const SkNx& a, const SkNx& b) { |
| 63 return SkNi(SkNi<N/2, T>::Min(a.fLo, b.fLo), SkNi<N/2, T>::Min(a.fHi, b.
fHi)); | 63 return SkNx(SkNx<N/2, T>::Min(a.fLo, b.fLo), SkNx<N/2, T>::Min(a.fHi, b.
fHi)); |
| 64 } | 64 } |
| 65 SkNi operator < (const SkNi& o) const { return SkNi(fLo < o.fLo, fHi < o.fHi
); } | 65 SkNx operator < (const SkNx& o) const { return SkNx(fLo < o.fLo, fHi < o.fHi
); } |
| 66 | 66 |
| 67 template <int k> T kth() const { | 67 template <int k> T kth() const { |
| 68 SkASSERT(0 <= k && k < N); | 68 SkASSERT(0 <= k && k < N); |
| 69 return k < N/2 ? fLo.template kth<k>() : fHi.template kth<k-N/2>(); | 69 return k < N/2 ? fLo.template kth<k>() : fHi.template kth<k-N/2>(); |
| 70 } | 70 } |
| 71 | 71 |
| 72 bool allTrue() const { return fLo.allTrue() && fHi.allTrue(); } | 72 bool allTrue() const { return fLo.allTrue() && fHi.allTrue(); } |
| 73 bool anyTrue() const { return fLo.anyTrue() || fHi.anyTrue(); } | 73 bool anyTrue() const { return fLo.anyTrue() || fHi.anyTrue(); } |
| 74 SkNi thenElse(const SkNi& t, const SkNi& e) const { | 74 SkNx thenElse(const SkNx& t, const SkNx& e) const { |
| 75 return SkNi(fLo.thenElse(t.fLo, e.fLo), fHi.thenElse(t.fHi, e.fHi)); | 75 return SkNx(fLo.thenElse(t.fLo, e.fLo), fHi.thenElse(t.fHi, e.fHi)); |
| 76 } | 76 } |
| 77 | 77 |
| 78 protected: | 78 protected: |
| 79 REQUIRE(0 == (N & (N-1))); | 79 REQUIRE(0 == (N & (N-1))); |
| 80 | 80 |
| 81 SkNi<N/2, T> fLo, fHi; | 81 SkNx<N/2, T> fLo, fHi; |
| 82 }; | 82 }; |
| 83 | 83 |
| 84 template <int N> | 84 template <int N> |
| 85 class SkNf { | 85 class SkNx<N,float> { |
| 86 public: | 86 public: |
| 87 SkNf() {} | 87 SkNx() {} |
| 88 SkNf(float val) : fLo(val), fHi(val) {} | 88 SkNx(float val) : fLo(val), fHi(val) {} |
| 89 static SkNf Load(const float vals[N]) { | 89 static SkNx Load(const float vals[N]) { |
| 90 return SkNf(SkNf<N/2>::Load(vals), SkNf<N/2>::Load(vals+N/2)); | 90 return SkNx(SkNx<N/2, float>::Load(vals), SkNx<N/2, float>::Load(vals+N/
2)); |
| 91 } | 91 } |
| 92 // FromBytes() and toBytes() specializations may assume their argument is N-
byte aligned. | 92 // FromBytes() and toBytes() specializations may assume their argument is N-
byte aligned. |
| 93 // E.g. Sk4f::FromBytes() may assume it's reading from a 4-byte-aligned poin
ter. | 93 // E.g. Sk4f::FromBytes() may assume it's reading from a 4-byte-aligned poin
ter. |
| 94 // Converts [0,255] bytes to [0.0, 255.0] floats. | 94 // Converts [0,255] bytes to [0.0, 255.0] floats. |
| 95 static SkNf FromBytes(const uint8_t bytes[N]) { | 95 static SkNx FromBytes(const uint8_t bytes[N]) { |
| 96 return SkNf(SkNf<N/2>::FromBytes(bytes), SkNf<N/2>::FromBytes(bytes+N/2)
); | 96 return SkNx(SkNx<N/2, float>::FromBytes(bytes), SkNx<N/2, float>::FromBy
tes(bytes+N/2)); |
| 97 } | 97 } |
| 98 | 98 |
| 99 SkNf(float a, float b) : fLo(a), fHi(b) { REQUIRE(N==2
); } | 99 SkNx(float a, float b) : fLo(a), fHi(b) { REQUIRE(N==2
); } |
| 100 SkNf(float a, float b, float c, float d) : fLo(a,b), fHi(c,d) { REQUIRE(N==4
); } | 100 SkNx(float a, float b, float c, float d) : fLo(a,b), fHi(c,d) { REQUIRE(N==4
); } |
| 101 SkNf(float a, float b, float c, float d, float e, float f, float g, float h) | 101 SkNx(float a, float b, float c, float d, float e, float f, float g, float h) |
| 102 : fLo(a,b,c,d) | 102 : fLo(a,b,c,d) |
| 103 , fHi(e,f,g,h) { REQUIRE(N==8); } | 103 , fHi(e,f,g,h) { REQUIRE(N==8); } |
| 104 | 104 |
| 105 void store(float vals[N]) const { | 105 void store(float vals[N]) const { |
| 106 fLo.store(vals); | 106 fLo.store(vals); |
| 107 fHi.store(vals+N/2); | 107 fHi.store(vals+N/2); |
| 108 } | 108 } |
| 109 // Please see note on FromBytes(). | 109 // Please see note on FromBytes(). |
| 110 // Clamps to [0.0,255.0] floats and truncates to [0,255] bytes. | 110 // Clamps to [0.0,255.0] floats and truncates to [0,255] bytes. |
| 111 void toBytes(uint8_t bytes[N]) const { | 111 void toBytes(uint8_t bytes[N]) const { |
| 112 fLo.toBytes(bytes); | 112 fLo.toBytes(bytes); |
| 113 fHi.toBytes(bytes+N/2); | 113 fHi.toBytes(bytes+N/2); |
| 114 } | 114 } |
| 115 | 115 |
| 116 SkNf operator + (const SkNf& o) const { return SkNf(fLo + o.fLo, fHi + o.fHi
); } | 116 SkNx operator + (const SkNx& o) const { return SkNx(fLo + o.fLo, fHi + o.fHi
); } |
| 117 SkNf operator - (const SkNf& o) const { return SkNf(fLo - o.fLo, fHi - o.fHi
); } | 117 SkNx operator - (const SkNx& o) const { return SkNx(fLo - o.fLo, fHi - o.fHi
); } |
| 118 SkNf operator * (const SkNf& o) const { return SkNf(fLo * o.fLo, fHi * o.fHi
); } | 118 SkNx operator * (const SkNx& o) const { return SkNx(fLo * o.fLo, fHi * o.fHi
); } |
| 119 SkNf operator / (const SkNf& o) const { return SkNf(fLo / o.fLo, fHi / o.fHi
); } | 119 SkNx operator / (const SkNx& o) const { return SkNx(fLo / o.fLo, fHi / o.fHi
); } |
| 120 | 120 |
| 121 SkNf operator == (const SkNf& o) const { return SkNf(fLo == o.fLo, fHi == o.
fHi); } | 121 SkNx operator == (const SkNx& o) const { return SkNx(fLo == o.fLo, fHi == o.
fHi); } |
| 122 SkNf operator != (const SkNf& o) const { return SkNf(fLo != o.fLo, fHi != o.
fHi); } | 122 SkNx operator != (const SkNx& o) const { return SkNx(fLo != o.fLo, fHi != o.
fHi); } |
| 123 SkNf operator < (const SkNf& o) const { return SkNf(fLo < o.fLo, fHi < o.
fHi); } | 123 SkNx operator < (const SkNx& o) const { return SkNx(fLo < o.fLo, fHi < o.
fHi); } |
| 124 SkNf operator > (const SkNf& o) const { return SkNf(fLo > o.fLo, fHi > o.
fHi); } | 124 SkNx operator > (const SkNx& o) const { return SkNx(fLo > o.fLo, fHi > o.
fHi); } |
| 125 SkNf operator <= (const SkNf& o) const { return SkNf(fLo <= o.fLo, fHi <= o.
fHi); } | 125 SkNx operator <= (const SkNx& o) const { return SkNx(fLo <= o.fLo, fHi <= o.
fHi); } |
| 126 SkNf operator >= (const SkNf& o) const { return SkNf(fLo >= o.fLo, fHi >= o.
fHi); } | 126 SkNx operator >= (const SkNx& o) const { return SkNx(fLo >= o.fLo, fHi >= o.
fHi); } |
| 127 | 127 |
| 128 static SkNf Min(const SkNf& l, const SkNf& r) { | 128 static SkNx Min(const SkNx& l, const SkNx& r) { |
| 129 return SkNf(SkNf<N/2>::Min(l.fLo, r.fLo), SkNf<N/2>::Min(l.fHi, r.fHi)); | 129 return SkNx(SkNx<N/2, float>::Min(l.fLo, r.fLo), SkNx<N/2, float>::Min(l
.fHi, r.fHi)); |
| 130 } | 130 } |
| 131 static SkNf Max(const SkNf& l, const SkNf& r) { | 131 static SkNx Max(const SkNx& l, const SkNx& r) { |
| 132 return SkNf(SkNf<N/2>::Max(l.fLo, r.fLo), SkNf<N/2>::Max(l.fHi, r.fHi)); | 132 return SkNx(SkNx<N/2, float>::Max(l.fLo, r.fLo), SkNx<N/2, float>::Max(l
.fHi, r.fHi)); |
| 133 } | 133 } |
| 134 | 134 |
| 135 SkNf sqrt() const { return SkNf(fLo. sqrt(), fHi. sqrt()); } | 135 SkNx sqrt() const { return SkNx(fLo. sqrt(), fHi. sqrt()); } |
| 136 | 136 |
| 137 // Generally, increasing precision, increasing cost. | 137 // Generally, increasing precision, increasing cost. |
| 138 SkNf rsqrt0() const { return SkNf(fLo.rsqrt0(), fHi.rsqrt0()); } | 138 SkNx rsqrt0() const { return SkNx(fLo.rsqrt0(), fHi.rsqrt0()); } |
| 139 SkNf rsqrt1() const { return SkNf(fLo.rsqrt1(), fHi.rsqrt1()); } | 139 SkNx rsqrt1() const { return SkNx(fLo.rsqrt1(), fHi.rsqrt1()); } |
| 140 SkNf rsqrt2() const { return SkNf(fLo.rsqrt2(), fHi.rsqrt2()); } | 140 SkNx rsqrt2() const { return SkNx(fLo.rsqrt2(), fHi.rsqrt2()); } |
| 141 | 141 |
| 142 SkNf invert() const { return SkNf(fLo. invert(), fHi. invert
()); } | 142 SkNx invert() const { return SkNx(fLo. invert(), fHi. invert
()); } |
| 143 SkNf approxInvert() const { return SkNf(fLo.approxInvert(), fHi.approxInvert
()); } | 143 SkNx approxInvert() const { return SkNx(fLo.approxInvert(), fHi.approxInvert
()); } |
| 144 | 144 |
| 145 template <int k> float kth() const { | 145 template <int k> float kth() const { |
| 146 SkASSERT(0 <= k && k < N); | 146 SkASSERT(0 <= k && k < N); |
| 147 return k < N/2 ? fLo.template kth<k>() : fHi.template kth<k-N/2>(); | 147 return k < N/2 ? fLo.template kth<k>() : fHi.template kth<k-N/2>(); |
| 148 } | 148 } |
| 149 | 149 |
| 150 bool allTrue() const { return fLo.allTrue() && fHi.allTrue(); } | 150 bool allTrue() const { return fLo.allTrue() && fHi.allTrue(); } |
| 151 bool anyTrue() const { return fLo.anyTrue() || fHi.anyTrue(); } | 151 bool anyTrue() const { return fLo.anyTrue() || fHi.anyTrue(); } |
| 152 SkNf thenElse(const SkNf& t, const SkNf& e) const { | 152 SkNx thenElse(const SkNx& t, const SkNx& e) const { |
| 153 return SkNf(fLo.thenElse(t.fLo, e.fLo), fHi.thenElse(t.fHi, e.fHi)); | 153 return SkNx(fLo.thenElse(t.fLo, e.fLo), fHi.thenElse(t.fHi, e.fHi)); |
| 154 } | 154 } |
| 155 | 155 |
| 156 protected: | 156 protected: |
| 157 REQUIRE(0 == (N & (N-1))); | 157 REQUIRE(0 == (N & (N-1))); |
| 158 SkNf(const SkNf<N/2>& lo, const SkNf<N/2>& hi) : fLo(lo), fHi(hi) {} | 158 SkNx(const SkNx<N/2, float>& lo, const SkNx<N/2, float>& hi) : fLo(lo), fHi(
hi) {} |
| 159 | 159 |
| 160 SkNf<N/2> fLo, fHi; | 160 SkNx<N/2, float> fLo, fHi; |
| 161 }; | 161 }; |
| 162 | 162 |
| 163 | 163 |
| 164 // Bottom out the default implementations with scalars when nothing's been speci
alized. | 164 // Bottom out the default implementations with scalars when nothing's been speci
alized. |
| 165 | 165 |
| 166 template <typename T> | 166 template <typename T> |
| 167 class SkNi<1,T> { | 167 class SkNx<1,T> { |
| 168 public: | 168 public: |
| 169 SkNi() {} | 169 SkNx() {} |
| 170 SkNi(T val) : fVal(val) {} | 170 SkNx(T val) : fVal(val) {} |
| 171 static SkNi Load(const T vals[1]) { return SkNi(vals[0]); } | 171 static SkNx Load(const T vals[1]) { return SkNx(vals[0]); } |
| 172 | 172 |
| 173 void store(T vals[1]) const { vals[0] = fVal; } | 173 void store(T vals[1]) const { vals[0] = fVal; } |
| 174 | 174 |
| 175 SkNi saturatedAdd(const SkNi& o) const { | 175 SkNx saturatedAdd(const SkNx& o) const { |
| 176 SkASSERT((T)(~0) > 0); // TODO: support signed T | 176 SkASSERT((T)(~0) > 0); // TODO: support signed T |
| 177 T sum = fVal + o.fVal; | 177 T sum = fVal + o.fVal; |
| 178 return SkNi(sum < fVal ? (T)(~0) : sum); | 178 return SkNx(sum < fVal ? (T)(~0) : sum); |
| 179 } | 179 } |
| 180 | 180 |
| 181 SkNi operator + (const SkNi& o) const { return SkNi(fVal + o.fVal); } | 181 SkNx operator + (const SkNx& o) const { return SkNx(fVal + o.fVal); } |
| 182 SkNi operator - (const SkNi& o) const { return SkNi(fVal - o.fVal); } | 182 SkNx operator - (const SkNx& o) const { return SkNx(fVal - o.fVal); } |
| 183 SkNi operator * (const SkNi& o) const { return SkNi(fVal * o.fVal); } | 183 SkNx operator * (const SkNx& o) const { return SkNx(fVal * o.fVal); } |
| 184 | 184 |
| 185 SkNi operator << (int bits) const { return SkNi(fVal << bits); } | 185 SkNx operator << (int bits) const { return SkNx(fVal << bits); } |
| 186 SkNi operator >> (int bits) const { return SkNi(fVal >> bits); } | 186 SkNx operator >> (int bits) const { return SkNx(fVal >> bits); } |
| 187 | 187 |
| 188 static SkNi Min(const SkNi& a, const SkNi& b) { return SkNi(SkTMin(a.fVal, b
.fVal)); } | 188 static SkNx Min(const SkNx& a, const SkNx& b) { return SkNx(SkTMin(a.fVal, b
.fVal)); } |
| 189 SkNi operator <(const SkNi& o) const { return SkNi(fVal < o.fVal); } | 189 SkNx operator <(const SkNx& o) const { return SkNx(fVal < o.fVal); } |
| 190 | 190 |
| 191 template <int k> T kth() const { | 191 template <int k> T kth() const { |
| 192 SkASSERT(0 == k); | 192 SkASSERT(0 == k); |
| 193 return fVal; | 193 return fVal; |
| 194 } | 194 } |
| 195 | 195 |
| 196 bool allTrue() const { return fVal; } | 196 bool allTrue() const { return fVal; } |
| 197 bool anyTrue() const { return fVal; } | 197 bool anyTrue() const { return fVal; } |
| 198 SkNi thenElse(const SkNi& t, const SkNi& e) const { return fVal ? t : e; } | 198 SkNx thenElse(const SkNx& t, const SkNx& e) const { return fVal ? t : e; } |
| 199 | 199 |
| 200 protected: | 200 protected: |
| 201 T fVal; | 201 T fVal; |
| 202 }; | 202 }; |
| 203 | 203 |
| 204 template <> | 204 template <> |
| 205 class SkNf<1> { | 205 class SkNx<1,float> { |
| 206 public: | 206 public: |
| 207 SkNf() {} | 207 SkNx() {} |
| 208 SkNf(float val) : fVal(val) {} | 208 SkNx(float val) : fVal(val) {} |
| 209 static SkNf Load(const float vals[1]) { return SkNf(vals[0]); } | 209 static SkNx Load(const float vals[1]) { return SkNx(vals[0]); } |
| 210 static SkNf FromBytes(const uint8_t bytes[1]) { return SkNf((float)bytes[0])
; } | 210 static SkNx FromBytes(const uint8_t bytes[1]) { return SkNx((float)bytes[0])
; } |
| 211 | 211 |
| 212 void store(float vals[1]) const { vals[0] = fVal; } | 212 void store(float vals[1]) const { vals[0] = fVal; } |
| 213 void toBytes(uint8_t bytes[1]) const { bytes[0] = (uint8_t)(SkTMin(fVal, 255
.0f)); } | 213 void toBytes(uint8_t bytes[1]) const { bytes[0] = (uint8_t)(SkTMin(fVal, 255
.0f)); } |
| 214 | 214 |
| 215 SkNf operator + (const SkNf& o) const { return SkNf(fVal + o.fVal); } | 215 SkNx operator + (const SkNx& o) const { return SkNx(fVal + o.fVal); } |
| 216 SkNf operator - (const SkNf& o) const { return SkNf(fVal - o.fVal); } | 216 SkNx operator - (const SkNx& o) const { return SkNx(fVal - o.fVal); } |
| 217 SkNf operator * (const SkNf& o) const { return SkNf(fVal * o.fVal); } | 217 SkNx operator * (const SkNx& o) const { return SkNx(fVal * o.fVal); } |
| 218 SkNf operator / (const SkNf& o) const { return SkNf(fVal / o.fVal); } | 218 SkNx operator / (const SkNx& o) const { return SkNx(fVal / o.fVal); } |
| 219 | 219 |
| 220 SkNf operator == (const SkNf& o) const { return SkNf(fVal == o.fVal); } | 220 SkNx operator == (const SkNx& o) const { return SkNx(fVal == o.fVal); } |
| 221 SkNf operator != (const SkNf& o) const { return SkNf(fVal != o.fVal); } | 221 SkNx operator != (const SkNx& o) const { return SkNx(fVal != o.fVal); } |
| 222 SkNf operator < (const SkNf& o) const { return SkNf(fVal < o.fVal); } | 222 SkNx operator < (const SkNx& o) const { return SkNx(fVal < o.fVal); } |
| 223 SkNf operator > (const SkNf& o) const { return SkNf(fVal > o.fVal); } | 223 SkNx operator > (const SkNx& o) const { return SkNx(fVal > o.fVal); } |
| 224 SkNf operator <= (const SkNf& o) const { return SkNf(fVal <= o.fVal); } | 224 SkNx operator <= (const SkNx& o) const { return SkNx(fVal <= o.fVal); } |
| 225 SkNf operator >= (const SkNf& o) const { return SkNf(fVal >= o.fVal); } | 225 SkNx operator >= (const SkNx& o) const { return SkNx(fVal >= o.fVal); } |
| 226 | 226 |
| 227 static SkNf Min(const SkNf& l, const SkNf& r) { return SkNf(SkTMin(l.fVal, r
.fVal)); } | 227 static SkNx Min(const SkNx& l, const SkNx& r) { return SkNx(SkTMin(l.fVal, r
.fVal)); } |
| 228 static SkNf Max(const SkNf& l, const SkNf& r) { return SkNf(SkTMax(l.fVal, r
.fVal)); } | 228 static SkNx Max(const SkNx& l, const SkNx& r) { return SkNx(SkTMax(l.fVal, r
.fVal)); } |
| 229 | 229 |
| 230 SkNf sqrt() const { return SkNf(sqrtf(fVal)); } | 230 SkNx sqrt() const { return SkNx(sqrtf(fVal)); } |
| 231 SkNf rsqrt0() const { return SkNf(1.0f / sqrtf(fVal)); } | 231 SkNx rsqrt0() const { return SkNx(1.0f / sqrtf(fVal)); } |
| 232 SkNf rsqrt1() const { return this->rsqrt0(); } | 232 SkNx rsqrt1() const { return this->rsqrt0(); } |
| 233 SkNf rsqrt2() const { return this->rsqrt1(); } | 233 SkNx rsqrt2() const { return this->rsqrt1(); } |
| 234 | 234 |
| 235 SkNf invert() const { return SkNf(1.0f / fVal); } | 235 SkNx invert() const { return SkNx(1.0f / fVal); } |
| 236 SkNf approxInvert() const { return this->invert(); } | 236 SkNx approxInvert() const { return this->invert(); } |
| 237 | 237 |
| 238 template <int k> float kth() const { | 238 template <int k> float kth() const { |
| 239 SkASSERT(k == 0); | 239 SkASSERT(k == 0); |
| 240 return fVal; | 240 return fVal; |
| 241 } | 241 } |
| 242 | 242 |
| 243 bool allTrue() const { return this->pun() != 0; } | 243 bool allTrue() const { return this->pun() != 0; } |
| 244 bool anyTrue() const { return this->pun() != 0; } | 244 bool anyTrue() const { return this->pun() != 0; } |
| 245 SkNf thenElse(const SkNf& t, const SkNf& e) const { return this->pun() ? t :
e; } | 245 SkNx thenElse(const SkNx& t, const SkNx& e) const { return this->pun() ? t :
e; } |
| 246 | 246 |
| 247 protected: | 247 protected: |
| 248 uint32_t pun() const { | 248 uint32_t pun() const { |
| 249 union { float f; uint32_t i; } pun = { fVal }; | 249 union { float f; uint32_t i; } pun = { fVal }; |
| 250 return pun.i; | 250 return pun.i; |
| 251 } | 251 } |
| 252 | 252 |
| 253 float fVal; | 253 float fVal; |
| 254 }; | 254 }; |
| 255 | 255 |
| 256 // This default implementation can be specialized by ../opts/SkNx_foo.h | 256 // This default implementation can be specialized by ../opts/SkNx_foo.h |
| 257 // if there's a better platform-specific shuffle strategy. | 257 // if there's a better platform-specific shuffle strategy. |
| 258 template <typename SkNx, int... Ix> | 258 template <typename Nx, int... Ix> |
| 259 inline SkNx SkNx_shuffle_impl(const SkNx& src) { return SkNx( src.template kth<I
x>()... ); } | 259 inline Nx SkNx_shuffle_impl(const Nx& src) { return Nx( src.template kth<Ix>()..
. ); } |
| 260 | 260 |
| 261 // This generic shuffle can be called on either SkNi or SkNf with 1 or N indices
: | 261 // This generic shuffle can be called with 1 or N indices: |
| 262 // Sk4f f(a,b,c,d); | 262 // Sk4f f(a,b,c,d); |
| 263 // SkNx_shuffle<3>(f); // ~~~> Sk4f(d,d,d,d) | 263 // SkNx_shuffle<3>(f); // ~~~> Sk4f(d,d,d,d) |
| 264 // SkNx_shuffle<2,1,0,3>(f); // ~~~> Sk4f(c,b,a,d) | 264 // SkNx_shuffle<2,1,0,3>(f); // ~~~> Sk4f(c,b,a,d) |
| 265 template <int... Ix, typename SkNx> | 265 template <int... Ix, typename Nx> |
| 266 inline SkNx SkNx_shuffle(const SkNx& src) { return SkNx_shuffle_impl<SkNx, Ix...
>(src); } | 266 inline Nx SkNx_shuffle(const Nx& src) { return SkNx_shuffle_impl<Nx, Ix...>(src)
; } |
| 267 | 267 |
| 268 // A reminder alias that shuffles can be used to duplicate a single index across
a vector. | 268 // A reminder alias that shuffles can be used to duplicate a single index across
a vector. |
| 269 template <int Ix, typename SkNx> | 269 template <int Ix, typename Nx> |
| 270 inline SkNx SkNx_dup(const SkNx& src) { return SkNx_shuffle<Ix>(src); } | 270 inline Nx SkNx_dup(const Nx& src) { return SkNx_shuffle<Ix>(src); } |
| 271 |
| 272 // This is a poor-man's std::make_index_sequence from C++14. |
| 273 // I'd implement it fully, but it hurts my head. |
| 274 template <int...> struct SkIntSequence {}; |
| 275 template <int N> struct MakeSkIntSequence; |
| 276 template <> struct MakeSkIntSequence< 1> : SkIntSequence<0
>{}; |
| 277 template <> struct MakeSkIntSequence< 2> : SkIntSequence<0,1
>{}; |
| 278 template <> struct MakeSkIntSequence< 4> : SkIntSequence<0,1,2,3
>{}; |
| 279 template <> struct MakeSkIntSequence< 8> : SkIntSequence<0,1,2,3,4,5,6,7
>{}; |
| 280 template <> struct MakeSkIntSequence<16> : SkIntSequence<0,1,2,3,4,5,6,7,8,9,10,
11,12,13,14,15>{}; |
| 281 |
| 282 // This is the default/fallback implementation for SkNx_cast. Best to specializ
e SkNx_cast! |
| 283 template <typename D, typename S, int N, int... Ix> |
| 284 SkNx<N,D> SkNx_cast_fallback(const SkNx<N,S>& src, SkIntSequence<Ix...>) { |
| 285 return SkNx<N,D>( (D)src.template kth<Ix>()... ); |
| 286 } |
| 287 |
| 288 // This is a generic cast between two SkNx with the same number of elements N.
E.g. |
| 289 // Sk4b bs = ...; // Load 4 bytes. |
| 290 // Sk4f fs = SkNx_cast<float>(bs); // (This will replace SkNf::FromBytes() o
ne day.) |
| 291 // Sk4i is = SkNx_cast<int>(fs); // Cast each float to int. |
| 292 // This can be specialized in ../opts/SkNx_foo.h if there's a better platform-sp
ecific cast. |
| 293 template <typename D, typename S, int N> |
| 294 SkNx<N,D> SkNx_cast(const SkNx<N,S>& src) { |
| 295 return SkNx_cast_fallback<D,S,N>(src, MakeSkIntSequence<N>()); |
| 296 } |
| 271 | 297 |
| 272 } // namespace | 298 } // namespace |
| 273 | 299 |
| 274 | 300 |
| 275 // Include platform specific specializations if available. | 301 // Include platform specific specializations if available. |
| 276 #ifndef SKNX_NO_SIMD | 302 #ifndef SKNX_NO_SIMD |
| 277 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_AVX | 303 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_AVX |
| 278 #include "../opts/SkNx_avx.h" | 304 #include "../opts/SkNx_avx.h" |
| 279 #elif SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE2 | 305 #elif SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE2 |
| 280 #include "../opts/SkNx_sse.h" | 306 #include "../opts/SkNx_sse.h" |
| 281 #elif defined(SK_ARM_HAS_NEON) | 307 #elif defined(SK_ARM_HAS_NEON) |
| 282 #include "../opts/SkNx_neon.h" | 308 #include "../opts/SkNx_neon.h" |
| 283 #endif | 309 #endif |
| 284 #endif | 310 #endif |
| 285 | 311 |
| 286 #undef REQUIRE | 312 #undef REQUIRE |
| 287 | 313 |
| 288 typedef SkNf<2> Sk2f; | 314 typedef SkNx<2, float> Sk2f; |
| 289 typedef SkNf<2> Sk2s; | 315 typedef SkNx<2, float> Sk2s; |
| 290 typedef SkNf<4> Sk4f; | 316 typedef SkNx<4, float> Sk4f; |
| 291 typedef SkNf<4> Sk4s; | 317 typedef SkNx<4, float> Sk4s; |
| 292 typedef SkNf<8> Sk8f; | 318 typedef SkNx<8, float> Sk8f; |
| 293 typedef SkNf<8> Sk8s; | 319 typedef SkNx<8, float> Sk8s; |
| 294 | 320 |
| 295 typedef SkNi<8, uint16_t> Sk8h; | 321 typedef SkNx<8, uint16_t> Sk8h; |
| 296 typedef SkNi<16, uint16_t> Sk16h; | 322 typedef SkNx<16, uint16_t> Sk16h; |
| 297 typedef SkNi<16, uint8_t> Sk16b; | 323 typedef SkNx<16, uint8_t> Sk16b; |
| 324 |
| 325 typedef SkNx<4, int> Sk4i; |
| 298 | 326 |
| 299 #endif//SkNx_DEFINED | 327 #endif//SkNx_DEFINED |
| OLD | NEW |