src/opts/SkPMFloat_sse.h - Issue 1286093004: Refactor to put SkXfermode_opts inside SK_OPTS_NS.

Side by Side Diff

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Keyboard Shortcuts

	File
u :	up to issue
j / k :	jump to file after / before current file
J / K :	jump to next file with a comment after / before current file
	Side-by-side diff
i :	toggle intra-line diffs
e :	expand all comments
c :	collapse all comments
s :	toggle showing all comments
n / p :	next / previous diff chunk or comment
N / P :	next / previous comment
<Up> / <Down> :	next / previous line

	Issue
u :	up to list of issues
j / k :	jump to patch after / before current patch
o / <Enter> :	open current patch in side-by-side view
i :	open current patch in unified diff view

	Issue List
j / k :	jump to issue after / before current issue
o / <Enter> :	open current issue

Side by Side Diff: src/opts/SkPMFloat_sse.h

Issue 1286093004: Refactor to put SkXfermode_opts inside SK_OPTS_NS. (Closed) Base URL: https://skia.googlesource.com/skia.git@master

Patch Set: Created 5 years, 4 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch

OLD	NEW
1 /*	1 /*

2 * Copyright 2015 Google Inc.	2 * Copyright 2015 Google Inc.

3 *	3 *

4 * Use of this source code is governed by a BSD-style license that can be	4 * Use of this source code is governed by a BSD-style license that can be

5 * found in the LICENSE file.	5 * found in the LICENSE file.

6 */	6 */

7	7

8 namespace { // See SkPMFloat.h	8 SK_ALWAYS_INLINE SkPMFloat::SkPMFloat(SkPMColor c) {

9

10 inline SkPMFloat::SkPMFloat(SkPMColor c) {

11 SkPMColorAssert(c);	9 SkPMColorAssert(c);

12 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3	10 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3

13 const int _ = 255; // Zero these bytes.	11 const int _ = 255; // Zero these bytes.

14 __m128i fix8 = _mm_cvtsi32_si128((int)c),	12 __m128i fix8 = _mm_cvtsi32_si128((int)c),

15 fix8_32 = _mm_shuffle_epi8(fix8, _mm_setr_epi8(0,_,_,_, 1,_,_,_, 2,_ ,_,_, 3,_,_,_));	13 fix8_32 = _mm_shuffle_epi8(fix8, _mm_setr_epi8(0,_,_,_, 1,_,_,_, 2,_ ,_,_, 3,_,_,_));

16 #else	14 #else

17 __m128i fix8 = _mm_cvtsi32_si128((int)c),	15 __m128i fix8 = _mm_cvtsi32_si128((int)c),

18 fix8_16 = _mm_unpacklo_epi8 (fix8, _mm_setzero_si128()),	16 fix8_16 = _mm_unpacklo_epi8 (fix8, _mm_setzero_si128()),

19 fix8_32 = _mm_unpacklo_epi16(fix8_16, _mm_setzero_si128());	17 fix8_32 = _mm_unpacklo_epi16(fix8_16, _mm_setzero_si128());

20 #endif	18 #endif

21 fVec = _mm_mul_ps(_mm_cvtepi32_ps(fix8_32), _mm_set1_ps(1.0f / 255));	19 fVec = _mm_mul_ps(_mm_cvtepi32_ps(fix8_32), _mm_set1_ps(1.0f / 255));

22 SkASSERT(this->isValid());	20 SkASSERT(this->isValid());

23 }	21 }

24	22

25 inline SkPMColor SkPMFloat::round() const {	23 SK_ALWAYS_INLINE SkPMColor SkPMFloat::round() const {

26 // We don't use _mm_cvtps_epi32, because we want precise control over how 0.5 rounds (up).	24 // We don't use _mm_cvtps_epi32, because we want precise control over how 0.5 rounds (up).

27 __m128 scaled = _mm_mul_ps(_mm_set1_ps(255), fVec);	25 __m128 scaled = _mm_mul_ps(_mm_set1_ps(255), fVec);

28 __m128i fix8_32 = _mm_cvttps_epi32(_mm_add_ps(_mm_set1_ps(0.5f), scaled)),	26 __m128i fix8_32 = _mm_cvttps_epi32(_mm_add_ps(_mm_set1_ps(0.5f), scaled)),

29 fix8_16 = _mm_packus_epi16(fix8_32, fix8_32),	27 fix8_16 = _mm_packus_epi16(fix8_32, fix8_32),

30 fix8 = _mm_packus_epi16(fix8_16, fix8_16);	28 fix8 = _mm_packus_epi16(fix8_16, fix8_16);

31 SkPMColor c = _mm_cvtsi128_si32(fix8);	29 SkPMColor c = _mm_cvtsi128_si32(fix8);

32 SkPMColorAssert(c);	30 SkPMColorAssert(c);

33 return c;	31 return c;

34 }	32 }

35	33

36 inline Sk4f SkPMFloat::alphas() const {	34 SK_ALWAYS_INLINE Sk4f SkPMFloat::alphas() const {

37 static_assert(SK_A32_SHIFT == 24, "");	35 static_assert(SK_A32_SHIFT == 24, "");

38 return _mm_shuffle_ps(fVec, fVec, 0xff); // Read as 11 11 11 11, copying lane 3 to all lanes.	36 return _mm_shuffle_ps(fVec, fVec, 0xff); // Read as 11 11 11 11, copying lane 3 to all lanes.

39 }	37 }

40

41 } // namespace

OLD	NEW

« no previous file with comments | « src/opts/SkPMFloat_none.h ('k') | src/opts/SkXfermode_opts.h » ('j') | no next file with comments »