| OLD | NEW |
| 1 /* | 1 /* |
| 2 * Copyright 2015 Google Inc. | 2 * Copyright 2015 Google Inc. |
| 3 * | 3 * |
| 4 * Use of this source code is governed by a BSD-style license that can be | 4 * Use of this source code is governed by a BSD-style license that can be |
| 5 * found in the LICENSE file. | 5 * found in the LICENSE file. |
| 6 */ | 6 */ |
| 7 | 7 |
| 8 #ifndef SkNx_sse_DEFINED | 8 #ifndef SkNx_sse_DEFINED |
| 9 #define SkNx_sse_DEFINED | 9 #define SkNx_sse_DEFINED |
| 10 | 10 |
| (...skipping 64 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 75 Nb operator != (const SkNf& o) const { return _mm_castps_si128(_mm_cmpneq_ps
(fVec, o.fVec)); } | 75 Nb operator != (const SkNf& o) const { return _mm_castps_si128(_mm_cmpneq_ps
(fVec, o.fVec)); } |
| 76 Nb operator < (const SkNf& o) const { return _mm_castps_si128(_mm_cmplt_ps
(fVec, o.fVec)); } | 76 Nb operator < (const SkNf& o) const { return _mm_castps_si128(_mm_cmplt_ps
(fVec, o.fVec)); } |
| 77 Nb operator > (const SkNf& o) const { return _mm_castps_si128(_mm_cmpgt_ps
(fVec, o.fVec)); } | 77 Nb operator > (const SkNf& o) const { return _mm_castps_si128(_mm_cmpgt_ps
(fVec, o.fVec)); } |
| 78 Nb operator <= (const SkNf& o) const { return _mm_castps_si128(_mm_cmple_ps
(fVec, o.fVec)); } | 78 Nb operator <= (const SkNf& o) const { return _mm_castps_si128(_mm_cmple_ps
(fVec, o.fVec)); } |
| 79 Nb operator >= (const SkNf& o) const { return _mm_castps_si128(_mm_cmpge_ps
(fVec, o.fVec)); } | 79 Nb operator >= (const SkNf& o) const { return _mm_castps_si128(_mm_cmpge_ps
(fVec, o.fVec)); } |
| 80 | 80 |
| 81 static SkNf Min(const SkNf& l, const SkNf& r) { return _mm_min_ps(l.fVec, r.
fVec); } | 81 static SkNf Min(const SkNf& l, const SkNf& r) { return _mm_min_ps(l.fVec, r.
fVec); } |
| 82 static SkNf Max(const SkNf& l, const SkNf& r) { return _mm_max_ps(l.fVec, r.
fVec); } | 82 static SkNf Max(const SkNf& l, const SkNf& r) { return _mm_max_ps(l.fVec, r.
fVec); } |
| 83 | 83 |
| 84 SkNf sqrt() const { return _mm_sqrt_ps (fVec); } | 84 SkNf sqrt() const { return _mm_sqrt_ps (fVec); } |
| 85 SkNf rsqrt0() const { return _mm_rsqrt_ps(fVec); } | 85 SkNf rsqrt() const { return _mm_rsqrt_ps(fVec); } |
| 86 SkNf rsqrt1() const { return this->rsqrt0(); } | |
| 87 SkNf rsqrt2() const { return this->rsqrt1(); } | |
| 88 | 86 |
| 89 SkNf invert() const { return SkNf(1) / *this; } | 87 SkNf invert() const { return SkNf(1) / *this; } |
| 90 SkNf approxInvert() const { return _mm_rcp_ps(fVec); } | 88 SkNf approxInvert() const { return _mm_rcp_ps(fVec); } |
| 91 | 89 |
| 92 template <int k> float kth() const { | 90 template <int k> float kth() const { |
| 93 SkASSERT(0 <= k && k < 2); | 91 SkASSERT(0 <= k && k < 2); |
| 94 union { __m128 v; float fs[4]; } pun = {fVec}; | 92 union { __m128 v; float fs[4]; } pun = {fVec}; |
| 95 return pun.fs[k&1]; | 93 return pun.fs[k&1]; |
| 96 } | 94 } |
| 97 | 95 |
| (...skipping 23 matching lines...) Expand all Loading... |
| 121 Nb operator != (const SkNf& o) const { return _mm_castpd_si128(_mm_cmpneq_pd
(fVec, o.fVec)); } | 119 Nb operator != (const SkNf& o) const { return _mm_castpd_si128(_mm_cmpneq_pd
(fVec, o.fVec)); } |
| 122 Nb operator < (const SkNf& o) const { return _mm_castpd_si128(_mm_cmplt_pd
(fVec, o.fVec)); } | 120 Nb operator < (const SkNf& o) const { return _mm_castpd_si128(_mm_cmplt_pd
(fVec, o.fVec)); } |
| 123 Nb operator > (const SkNf& o) const { return _mm_castpd_si128(_mm_cmpgt_pd
(fVec, o.fVec)); } | 121 Nb operator > (const SkNf& o) const { return _mm_castpd_si128(_mm_cmpgt_pd
(fVec, o.fVec)); } |
| 124 Nb operator <= (const SkNf& o) const { return _mm_castpd_si128(_mm_cmple_pd
(fVec, o.fVec)); } | 122 Nb operator <= (const SkNf& o) const { return _mm_castpd_si128(_mm_cmple_pd
(fVec, o.fVec)); } |
| 125 Nb operator >= (const SkNf& o) const { return _mm_castpd_si128(_mm_cmpge_pd
(fVec, o.fVec)); } | 123 Nb operator >= (const SkNf& o) const { return _mm_castpd_si128(_mm_cmpge_pd
(fVec, o.fVec)); } |
| 126 | 124 |
| 127 static SkNf Min(const SkNf& l, const SkNf& r) { return _mm_min_pd(l.fVec, r.
fVec); } | 125 static SkNf Min(const SkNf& l, const SkNf& r) { return _mm_min_pd(l.fVec, r.
fVec); } |
| 128 static SkNf Max(const SkNf& l, const SkNf& r) { return _mm_max_pd(l.fVec, r.
fVec); } | 126 static SkNf Max(const SkNf& l, const SkNf& r) { return _mm_max_pd(l.fVec, r.
fVec); } |
| 129 | 127 |
| 130 SkNf sqrt() const { return _mm_sqrt_pd(fVec); } | 128 SkNf sqrt() const { return _mm_sqrt_pd(fVec); } |
| 131 SkNf rsqrt0() const { return _mm_cvtps_pd(_mm_rsqrt_ps(_mm_cvtpd_ps(fVec)));
} | 129 SkNf rsqrt() const { return _mm_cvtps_pd(_mm_rsqrt_ps(_mm_cvtpd_ps(fVec)));
} |
| 132 SkNf rsqrt1() const { return this->rsqrt0(); } | |
| 133 SkNf rsqrt2() const { return this->rsqrt1(); } | |
| 134 | 130 |
| 135 SkNf invert() const { return SkNf(1) / *this; } | 131 SkNf invert() const { return SkNf(1) / *this; } |
| 136 SkNf approxInvert() const { return _mm_cvtps_pd(_mm_rcp_ps(_mm_cvtpd_ps(fVec
))); } | 132 SkNf approxInvert() const { return _mm_cvtps_pd(_mm_rcp_ps(_mm_cvtpd_ps(fVec
))); } |
| 137 | 133 |
| 138 template <int k> double kth() const { | 134 template <int k> double kth() const { |
| 139 SkASSERT(0 <= k && k < 2); | 135 SkASSERT(0 <= k && k < 2); |
| 140 union { __m128d v; double ds[2]; } pun = {fVec}; | 136 union { __m128d v; double ds[2]; } pun = {fVec}; |
| 141 return pun.ds[k&1]; | 137 return pun.ds[k&1]; |
| 142 } | 138 } |
| 143 | 139 |
| (...skipping 63 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 207 Nb operator != (const SkNf& o) const { return _mm_castps_si128(_mm_cmpneq_ps
(fVec, o.fVec)); } | 203 Nb operator != (const SkNf& o) const { return _mm_castps_si128(_mm_cmpneq_ps
(fVec, o.fVec)); } |
| 208 Nb operator < (const SkNf& o) const { return _mm_castps_si128(_mm_cmplt_ps
(fVec, o.fVec)); } | 204 Nb operator < (const SkNf& o) const { return _mm_castps_si128(_mm_cmplt_ps
(fVec, o.fVec)); } |
| 209 Nb operator > (const SkNf& o) const { return _mm_castps_si128(_mm_cmpgt_ps
(fVec, o.fVec)); } | 205 Nb operator > (const SkNf& o) const { return _mm_castps_si128(_mm_cmpgt_ps
(fVec, o.fVec)); } |
| 210 Nb operator <= (const SkNf& o) const { return _mm_castps_si128(_mm_cmple_ps
(fVec, o.fVec)); } | 206 Nb operator <= (const SkNf& o) const { return _mm_castps_si128(_mm_cmple_ps
(fVec, o.fVec)); } |
| 211 Nb operator >= (const SkNf& o) const { return _mm_castps_si128(_mm_cmpge_ps
(fVec, o.fVec)); } | 207 Nb operator >= (const SkNf& o) const { return _mm_castps_si128(_mm_cmpge_ps
(fVec, o.fVec)); } |
| 212 | 208 |
| 213 static SkNf Min(const SkNf& l, const SkNf& r) { return _mm_min_ps(l.fVec, r.
fVec); } | 209 static SkNf Min(const SkNf& l, const SkNf& r) { return _mm_min_ps(l.fVec, r.
fVec); } |
| 214 static SkNf Max(const SkNf& l, const SkNf& r) { return _mm_max_ps(l.fVec, r.
fVec); } | 210 static SkNf Max(const SkNf& l, const SkNf& r) { return _mm_max_ps(l.fVec, r.
fVec); } |
| 215 | 211 |
| 216 SkNf sqrt() const { return _mm_sqrt_ps (fVec); } | 212 SkNf sqrt() const { return _mm_sqrt_ps (fVec); } |
| 217 SkNf rsqrt0() const { return _mm_rsqrt_ps(fVec); } | 213 SkNf rsqrt() const { return _mm_rsqrt_ps(fVec); } |
| 218 SkNf rsqrt1() const { return this->rsqrt0(); } | |
| 219 SkNf rsqrt2() const { return this->rsqrt1(); } | |
| 220 | 214 |
| 221 SkNf invert() const { return SkNf(1) / *this; } | 215 SkNf invert() const { return SkNf(1) / *this; } |
| 222 SkNf approxInvert() const { return _mm_rcp_ps(fVec); } | 216 SkNf approxInvert() const { return _mm_rcp_ps(fVec); } |
| 223 | 217 |
| 224 template <int k> float kth() const { | 218 template <int k> float kth() const { |
| 225 SkASSERT(0 <= k && k < 4); | 219 SkASSERT(0 <= k && k < 4); |
| 226 union { __m128 v; float fs[4]; } pun = {fVec}; | 220 union { __m128 v; float fs[4]; } pun = {fVec}; |
| 227 return pun.fs[k&3]; | 221 return pun.fs[k&3]; |
| 228 } | 222 } |
| 229 | 223 |
| (...skipping 50 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 280 | 274 |
| 281 template <int k> uint16_t kth() const { | 275 template <int k> uint16_t kth() const { |
| 282 SkASSERT(0 <= k && k < 8); | 276 SkASSERT(0 <= k && k < 8); |
| 283 return _mm_extract_epi16(fVec, k); | 277 return _mm_extract_epi16(fVec, k); |
| 284 } | 278 } |
| 285 protected: | 279 protected: |
| 286 __m128i fVec; | 280 __m128i fVec; |
| 287 }; | 281 }; |
| 288 | 282 |
| 289 #endif//SkNx_sse_DEFINED | 283 #endif//SkNx_sse_DEFINED |
| OLD | NEW |