Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(42)

Side by Side Diff: src/opts/SkPMFloat_sse.h

Issue 1286093004: Refactor to put SkXfermode_opts inside SK_OPTS_NS. (Closed) Base URL: https://skia.googlesource.com/skia.git@master
Patch Set: Created 5 years, 4 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« no previous file with comments | « src/opts/SkPMFloat_none.h ('k') | src/opts/SkXfermode_opts.h » ('j') | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLD | NEW
1 /* 1 /*
2 * Copyright 2015 Google Inc. 2 * Copyright 2015 Google Inc.
3 * 3 *
4 * Use of this source code is governed by a BSD-style license that can be 4 * Use of this source code is governed by a BSD-style license that can be
5 * found in the LICENSE file. 5 * found in the LICENSE file.
6 */ 6 */
7 7
8 namespace { // See SkPMFloat.h 8 SK_ALWAYS_INLINE SkPMFloat::SkPMFloat(SkPMColor c) {
9
10 inline SkPMFloat::SkPMFloat(SkPMColor c) {
11 SkPMColorAssert(c); 9 SkPMColorAssert(c);
12 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3 10 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3
13 const int _ = 255; // Zero these bytes. 11 const int _ = 255; // Zero these bytes.
14 __m128i fix8 = _mm_cvtsi32_si128((int)c), 12 __m128i fix8 = _mm_cvtsi32_si128((int)c),
15 fix8_32 = _mm_shuffle_epi8(fix8, _mm_setr_epi8(0,_,_,_, 1,_,_,_, 2,_,_,_, 3,_,_,_)); 13 fix8_32 = _mm_shuffle_epi8(fix8, _mm_setr_epi8(0,_,_,_, 1,_,_,_, 2,_,_,_, 3,_,_,_));
16 #else 14 #else
17 __m128i fix8 = _mm_cvtsi32_si128((int)c), 15 __m128i fix8 = _mm_cvtsi32_si128((int)c),
18 fix8_16 = _mm_unpacklo_epi8 (fix8, _mm_setzero_si128()), 16 fix8_16 = _mm_unpacklo_epi8 (fix8, _mm_setzero_si128()),
19 fix8_32 = _mm_unpacklo_epi16(fix8_16, _mm_setzero_si128()); 17 fix8_32 = _mm_unpacklo_epi16(fix8_16, _mm_setzero_si128());
20 #endif 18 #endif
21 fVec = _mm_mul_ps(_mm_cvtepi32_ps(fix8_32), _mm_set1_ps(1.0f / 255)); 19 fVec = _mm_mul_ps(_mm_cvtepi32_ps(fix8_32), _mm_set1_ps(1.0f / 255));
22 SkASSERT(this->isValid()); 20 SkASSERT(this->isValid());
23 } 21 }
24 22
25 inline SkPMColor SkPMFloat::round() const { 23 SK_ALWAYS_INLINE SkPMColor SkPMFloat::round() const {
26 // We don't use _mm_cvtps_epi32, because we want precise control over how 0.5 rounds (up). 24 // We don't use _mm_cvtps_epi32, because we want precise control over how 0.5 rounds (up).
27 __m128 scaled = _mm_mul_ps(_mm_set1_ps(255), fVec); 25 __m128 scaled = _mm_mul_ps(_mm_set1_ps(255), fVec);
28 __m128i fix8_32 = _mm_cvttps_epi32(_mm_add_ps(_mm_set1_ps(0.5f), scaled)), 26 __m128i fix8_32 = _mm_cvttps_epi32(_mm_add_ps(_mm_set1_ps(0.5f), scaled)),
29 fix8_16 = _mm_packus_epi16(fix8_32, fix8_32), 27 fix8_16 = _mm_packus_epi16(fix8_32, fix8_32),
30 fix8 = _mm_packus_epi16(fix8_16, fix8_16); 28 fix8 = _mm_packus_epi16(fix8_16, fix8_16);
31 SkPMColor c = _mm_cvtsi128_si32(fix8); 29 SkPMColor c = _mm_cvtsi128_si32(fix8);
32 SkPMColorAssert(c); 30 SkPMColorAssert(c);
33 return c; 31 return c;
34 } 32 }
35 33
36 inline Sk4f SkPMFloat::alphas() const { 34 SK_ALWAYS_INLINE Sk4f SkPMFloat::alphas() const {
37 static_assert(SK_A32_SHIFT == 24, ""); 35 static_assert(SK_A32_SHIFT == 24, "");
38 return _mm_shuffle_ps(fVec, fVec, 0xff); // Read as 11 11 11 11, copying lane 3 to all lanes. 36 return _mm_shuffle_ps(fVec, fVec, 0xff); // Read as 11 11 11 11, copying lane 3 to all lanes.
39 } 37 }
40
41 } // namespace
OLD | NEW
« no previous file with comments | « src/opts/SkPMFloat_none.h ('k') | src/opts/SkXfermode_opts.h » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698