src/opts/SkColor_opts_SSE2.h - Issue 724333003: Optimize SkAlphaMulQ_SSE2

Keyboard Shortcuts

	File
u :	up to issue
j / k :	jump to file after / before current file
J / K :	jump to next file with a comment after / before current file
	Side-by-side diff
i :	toggle intra-line diffs
e :	expand all comments
c :	collapse all comments
s :	toggle showing all comments
n / p :	next / previous diff chunk or comment
N / P :	next / previous comment
<Up> / <Down> :	next / previous line

	Issue
u :	up to list of issues
j / k :	jump to patch after / before current patch
o / <Enter> :	open current patch in side-by-side view
i :	open current patch in unified diff view

	Issue List
j / k :	jump to issue after / before current issue
o / <Enter> :	open current issue

Unified Diff: src/opts/SkColor_opts_SSE2.h

Issue 724333003: Optimize SkAlphaMulQ_SSE2 (Closed) Base URL: https://skia.googlesource.com/skia.git@master

Patch Set: add assert Created 6 years, 1 month ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

Index: src/opts/SkColor_opts_SSE2.h

diff --git a/src/opts/SkColor_opts_SSE2.h b/src/opts/SkColor_opts_SSE2.h

index 7e61d526b3bf4427462b59e407187d32fb52bcd6..08cde8e009eee2cfe18a017ed872e2084b93b1f2 100644

--- a/src/opts/SkColor_opts_SSE2.h

+++ b/src/opts/SkColor_opts_SSE2.h

@@ -10,6 +10,8 @@

#include <emmintrin.h>

+#define ASSERT_EQ(a,b) SkASSERT(0xffff == _mm_movemask_epi8(_mm_cmpeq_epi8((a), (b))))

// Because no _mm_mul_epi32() in SSE2, we emulate it here.

// Multiplies 4 32-bit integers from a by 4 32-bit integers from b.

// The 4 multiplication results should be represented within 32-bit

@@ -52,11 +54,11 @@ static inline __m128i SkAlphaMulQ_SSE2(const __m128i& c, const __m128i& scale) {

// uint32_t ag = ((c >> 8) & mask) * scale

__m128i ag = _mm_srli_epi16(c, 8);

- ag = _mm_and_si128(ag, mask);

+ ASSERT_EQ(ag, _mm_and_si128(mask, ag)); // ag = _mm_srli_epi16(c, 8) did this for us.

ag = _mm_mullo_epi16(ag, s);

// (rb & mask) | (ag & ~mask)

- rb = _mm_and_si128(mask, rb);

+ ASSERT_EQ(rb, _mm_and_si128(mask, rb)); // rb = _mm_srli_epi16(rb, 8) did this for us.

ag = _mm_andnot_si128(mask, ag);

return _mm_or_si128(rb, ag);

}

« no previous file with comments | « no previous file | no next file » | no next file with comments »