OLD | NEW |
1 /* | 1 /* |
2 * Copyright 2015 Google Inc. | 2 * Copyright 2015 Google Inc. |
3 * | 3 * |
4 * Use of this source code is governed by a BSD-style license that can be | 4 * Use of this source code is governed by a BSD-style license that can be |
5 * found in the LICENSE file. | 5 * found in the LICENSE file. |
6 */ | 6 */ |
7 | 7 |
8 #ifndef SkNx_sse_DEFINED | 8 #ifndef SkNx_sse_DEFINED |
9 #define SkNx_sse_DEFINED | 9 #define SkNx_sse_DEFINED |
10 | 10 |
(...skipping 106 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
117 float operator[](int k) const { | 117 float operator[](int k) const { |
118 SkASSERT(0 <= k && k < 4); | 118 SkASSERT(0 <= k && k < 4); |
119 union { __m128 v; float fs[4]; } pun = {fVec}; | 119 union { __m128 v; float fs[4]; } pun = {fVec}; |
120 return pun.fs[k&3]; | 120 return pun.fs[k&3]; |
121 } | 121 } |
122 | 122 |
123 bool allTrue() const { return 0xffff == _mm_movemask_epi8(_mm_castps_si128(f
Vec)); } | 123 bool allTrue() const { return 0xffff == _mm_movemask_epi8(_mm_castps_si128(f
Vec)); } |
124 bool anyTrue() const { return 0x0000 != _mm_movemask_epi8(_mm_castps_si128(f
Vec)); } | 124 bool anyTrue() const { return 0x0000 != _mm_movemask_epi8(_mm_castps_si128(f
Vec)); } |
125 | 125 |
126 SkNx thenElse(const SkNx& t, const SkNx& e) const { | 126 SkNx thenElse(const SkNx& t, const SkNx& e) const { |
| 127 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSE41 |
| 128 return _mm_blendv_ps(e.fVec, t.fVec, fVec); |
| 129 #else |
127 return _mm_or_ps(_mm_and_ps (fVec, t.fVec), | 130 return _mm_or_ps(_mm_and_ps (fVec, t.fVec), |
128 _mm_andnot_ps(fVec, e.fVec)); | 131 _mm_andnot_ps(fVec, e.fVec)); |
| 132 #endif |
129 } | 133 } |
130 | 134 |
131 __m128 fVec; | 135 __m128 fVec; |
132 }; | 136 }; |
133 | 137 |
134 template <> | 138 template <> |
135 class SkNx<4, int> { | 139 class SkNx<4, int> { |
136 public: | 140 public: |
137 SkNx(const __m128i& vec) : fVec(vec) {} | 141 SkNx(const __m128i& vec) : fVec(vec) {} |
138 | 142 |
(...skipping 228 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
367 | 371 |
368 template<> /*static*/ inline Sk4h SkNx_cast<uint16_t, uint8_t>(const Sk4b& src)
{ | 372 template<> /*static*/ inline Sk4h SkNx_cast<uint16_t, uint8_t>(const Sk4b& src)
{ |
369 return _mm_unpacklo_epi8(src.fVec, _mm_setzero_si128()); | 373 return _mm_unpacklo_epi8(src.fVec, _mm_setzero_si128()); |
370 } | 374 } |
371 | 375 |
372 template<> /*static*/ inline Sk4b SkNx_cast<uint8_t, uint16_t>(const Sk4h& src)
{ | 376 template<> /*static*/ inline Sk4b SkNx_cast<uint8_t, uint16_t>(const Sk4h& src)
{ |
373 return _mm_packus_epi16(src.fVec, src.fVec); | 377 return _mm_packus_epi16(src.fVec, src.fVec); |
374 } | 378 } |
375 | 379 |
376 #endif//SkNx_sse_DEFINED | 380 #endif//SkNx_sse_DEFINED |
OLD | NEW |