src/opts/SkPMFloat_sse.h - Issue 1294213002: Remove SkOpts_sse2.cpp.

Side by Side Diff

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Keyboard Shortcuts

	File
u :	up to issue
j / k :	jump to file after / before current file
J / K :	jump to next file with a comment after / before current file
	Side-by-side diff
i :	toggle intra-line diffs
e :	expand all comments
c :	collapse all comments
s :	toggle showing all comments
n / p :	next / previous diff chunk or comment
N / P :	next / previous comment
<Up> / <Down> :	next / previous line

	Issue
u :	up to list of issues
j / k :	jump to patch after / before current patch
o / <Enter> :	open current patch in side-by-side view
i :	open current patch in unified diff view

	Issue List
j / k :	jump to issue after / before current issue
o / <Enter> :	open current issue

Side by Side Diff: src/opts/SkPMFloat_sse.h

Issue 1294213002: Remove SkOpts_sse2.cpp. (Closed) Base URL: https://skia.googlesource.com/skia.git@master

Patch Set: char ~0 Created 5 years, 4 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch

« no previous file with comments | « src/opts/SkOpts_ssse3.cpp ('k') | no next file » | no next file with comments »

OLD	NEW
1 /*	1 /*

2 * Copyright 2015 Google Inc.	2 * Copyright 2015 Google Inc.

3 *	3 *

4 * Use of this source code is governed by a BSD-style license that can be	4 * Use of this source code is governed by a BSD-style license that can be

5 * found in the LICENSE file.	5 * found in the LICENSE file.

6 */	6 */

7	7

8 namespace { // See SkPMFloat.h	8 namespace { // See SkPMFloat.h

9	9

10 inline SkPMFloat::SkPMFloat(SkPMColor c) {	10 inline SkPMFloat::SkPMFloat(SkPMColor c) {

11 SkPMColorAssert(c);	11 SkPMColorAssert(c);

12 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3	12 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3

13 const int _ = 255; // Zero these bytes.	13 const char _ = ~0; // Zero these bytes.

14 __m128i fix8 = _mm_cvtsi32_si128((int)c),	14 __m128i fix8 = _mm_cvtsi32_si128((int)c),

15 fix8_32 = _mm_shuffle_epi8(fix8, _mm_setr_epi8(0,_,_,_, 1,_,_,_, 2,_,_,_, 3,_,_,_));	15 fix8_32 = _mm_shuffle_epi8(fix8, _mm_setr_epi8(0,_,_,_, 1,_,_,_, 2,_,_,_, 3,_,_,_));

16 #else	16 #else

17 __m128i fix8 = _mm_cvtsi32_si128((int)c),	17 __m128i fix8 = _mm_cvtsi32_si128((int)c),

18 fix8_16 = _mm_unpacklo_epi8 (fix8, _mm_setzero_si128()),	18 fix8_16 = _mm_unpacklo_epi8 (fix8, _mm_setzero_si128()),

19 fix8_32 = _mm_unpacklo_epi16(fix8_16, _mm_setzero_si128());	19 fix8_32 = _mm_unpacklo_epi16(fix8_16, _mm_setzero_si128());

20 #endif	20 #endif

21 fVec = _mm_mul_ps(_mm_cvtepi32_ps(fix8_32), _mm_set1_ps(1.0f / 255));	21 fVec = _mm_mul_ps(_mm_cvtepi32_ps(fix8_32), _mm_set1_ps(1.0f / 255));

22 SkASSERT(this->isValid());	22 SkASSERT(this->isValid());

23 }	23 }

24	24

25 inline SkPMColor SkPMFloat::round() const {	25 inline SkPMColor SkPMFloat::round() const {

26 // We don't use _mm_cvtps_epi32, because we want precise control over how 0.5 rounds (up).	26 // We don't use _mm_cvtps_epi32, because we want precise control over how 0.5 rounds (up).

27 __m128 scaled = _mm_mul_ps(_mm_set1_ps(255), fVec);	27 __m128 scaled = _mm_mul_ps(_mm_set1_ps(255), fVec);

28 __m128i fix8_32 = _mm_cvttps_epi32(_mm_add_ps(_mm_set1_ps(0.5f), scaled)),	28 __m128i fix8_32 = _mm_cvttps_epi32(_mm_add_ps(_mm_set1_ps(0.5f), scaled)),

29 fix8_16 = _mm_packus_epi16(fix8_32, fix8_32),	29 fix8_16 = _mm_packus_epi16(fix8_32, fix8_32),

30 fix8 = _mm_packus_epi16(fix8_16, fix8_16);	30 fix8 = _mm_packus_epi16(fix8_16, fix8_16);

31 SkPMColor c = _mm_cvtsi128_si32(fix8);	31 SkPMColor c = _mm_cvtsi128_si32(fix8);

32 SkPMColorAssert(c);	32 SkPMColorAssert(c);

33 return c;	33 return c;

34 }	34 }

35	35

36 inline Sk4f SkPMFloat::alphas() const {	36 inline Sk4f SkPMFloat::alphas() const {

37 static_assert(SK_A32_SHIFT == 24, "");	37 static_assert(SK_A32_SHIFT == 24, "");

38 return _mm_shuffle_ps(fVec, fVec, 0xff); // Read as 11 11 11 11, copying lane 3 to all lanes.	38 return _mm_shuffle_ps(fVec, fVec, 0xff); // Read as 11 11 11 11, copying lane 3 to all lanes.

39 }	39 }

40	40

41 } // namespace	41 } // namespace

OLD	NEW