Chromium Code Reviews| Index: src/opts/SkPMFloat_sse.h |
| diff --git a/src/opts/SkPMFloat_sse.h b/src/opts/SkPMFloat_sse.h |
| index 6cfee1da6fe8df4f24f6df23be921e8c20e55d17..6a4d5b6b5c1dbbfc9893223ba2ef17e05e9725bc 100644 |
| --- a/src/opts/SkPMFloat_sse.h |
| +++ b/src/opts/SkPMFloat_sse.h |
| @@ -38,15 +38,16 @@ inline Sk4f SkPMFloat::alphas() const { |
| return _mm_shuffle_ps(fVec, fVec, 0xff); // Read as 11 11 11 11, copying lane 3 to all lanes. |
| } |
| -inline SkPMFloat SkPMFloat::FromBGRx(SkColor c) { |
| +inline SkPMFloat SkPMFloat::FromOpaqueColor(SkColor c) { |
| + SkASSERT(SkColorGetA(c) == 0xFF); |
| __m128i fix8 = _mm_cvtsi32_si128((int)c); |
| #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3 |
| const char _ = ~0; // Zero these bytes. |
| __m128i fix8_32 = _mm_shuffle_epi8(fix8, |
| #if defined(SK_PMCOLOR_IS_BGRA) |
| - _mm_setr_epi8(0,_,_,_, 1,_,_,_, 2,_,_,_, _,_,_,_) |
| + _mm_setr_epi8(0,_,_,_, 1,_,_,_, 2,_,_,_, 3,_,_,_) |
| #else |
| - _mm_setr_epi8(2,_,_,_, 1,_,_,_, 0,_,_,_, _,_,_,_) |
| + _mm_setr_epi8(2,_,_,_, 1,_,_,_, 0,_,_,_, 3,_,_,_) |
| #endif |
| ); |
| #else |
| @@ -56,8 +57,6 @@ inline SkPMFloat SkPMFloat::FromBGRx(SkColor c) { |
| fix8_32 = _mm_shuffle_epi32(fix8_32, 0xC6); // C6 == 11 00 01 10, i.e swap lanes 0 and 2. |
| #endif |
| #endif |
| - fix8_32 = _mm_or_si128(fix8_32, _mm_set_epi32(0xFF,0,0,0)); // Force alpha to 1. |
|
Noel Gordon
2015/08/20 01:43:29
Very cool; fewer instructions generally means more…
mtklein
2015/08/20 01:55:17
Yeah, _mm_set_ps doesn't really correspond to any…
|
| - |
| SkPMFloat pmf = Sk4f(_mm_mul_ps(_mm_cvtepi32_ps(fix8_32), _mm_set1_ps(1.0f/255))); |
| SkASSERT(pmf.isValid()); |
| return pmf; |