| OLD | NEW |
| 1 /* | 1 /* |
| 2 * Copyright 2013 The Android Open Source Project | 2 * Copyright 2013 The Android Open Source Project |
| 3 * | 3 * |
| 4 * Use of this source code is governed by a BSD-style license that can be | 4 * Use of this source code is governed by a BSD-style license that can be |
| 5 * found in the LICENSE file. | 5 * found in the LICENSE file. |
| 6 */ | 6 */ |
| 7 | 7 |
| 8 | 8 #include <emmintrin.h> |
| 9 #include "SkBitmap.h" | 9 #include "SkBitmap.h" |
| 10 #include "SkBlurImage_opts_SSE2.h" |
| 10 #include "SkColorPriv.h" | 11 #include "SkColorPriv.h" |
| 11 #include "SkBlurImage_opts_SSE2.h" | |
| 12 #include "SkRect.h" | 12 #include "SkRect.h" |
| 13 | 13 |
| 14 #include <emmintrin.h> | |
| 15 | |
| 16 namespace { | 14 namespace { |
| 17 | |
| 18 enum BlurDirection { | 15 enum BlurDirection { |
| 19 kX, kY | 16 kX, kY |
| 20 }; | 17 }; |
| 21 | 18 |
| 22 /** | 19 /* Helper function to spread the components of a 32-bit integer into the |
| 23 * Helper function to spread the components of a 32-bit integer into the | |
| 24 * lower 8 bits of each 32-bit element of an SSE register. | 20 * lower 8 bits of each 32-bit element of an SSE register. |
| 25 */ | 21 */ |
| 22 inline __m128i expand(int a) { |
| 23 const __m128i zero = _mm_setzero_si128(); |
| 26 | 24 |
| 27 inline __m128i expand(int a) { | 25 // 0 0 0 0 0 0 0 0 0 0 0 0 A R G B |
| 28 const __m128i zero = _mm_setzero_si128(); | 26 __m128i result = _mm_cvtsi32_si128(a); |
| 29 | 27 |
| 30 // 0 0 0 0 0 0 0 0 0 0 0 0 A R G B | 28 // 0 0 0 0 0 0 0 0 0 A 0 R 0 G 0 B |
| 31 __m128i result = _mm_cvtsi32_si128(a); | 29 result = _mm_unpacklo_epi8(result, zero); |
| 32 | 30 |
| 33 // 0 0 0 0 0 0 0 0 0 A 0 R 0 G 0 B | 31 // 0 0 0 A 0 0 0 R 0 0 0 G 0 0 0 B |
| 34 result = _mm_unpacklo_epi8(result, zero); | 32 return _mm_unpacklo_epi16(result, zero); |
| 35 | |
| 36 // 0 0 0 A 0 0 0 R 0 0 0 G 0 0 0 B | |
| 37 return _mm_unpacklo_epi16(result, zero); | |
| 38 } | 33 } |
| 39 | 34 |
| 40 template<BlurDirection srcDirection, BlurDirection dstDirection> | 35 template<BlurDirection srcDirection, BlurDirection dstDirection> |
| 41 void SkBoxBlur_SSE2(const SkPMColor* src, int srcStride, SkPMColor* dst, int ker
nelSize, | 36 void SkBoxBlur_SSE2(const SkPMColor* src, int srcStride, SkPMColor* dst, int ker
nelSize, |
| 42 int leftOffset, int rightOffset, int width, int height) | 37 int leftOffset, int rightOffset, int width, int height) |
| 43 { | 38 { |
| 44 const int rightBorder = SkMin32(rightOffset + 1, width); | 39 const int rightBorder = SkMin32(rightOffset + 1, width); |
| 45 const int srcStrideX = srcDirection == kX ? 1 : srcStride; | 40 const int srcStrideX = srcDirection == kX ? 1 : srcStride; |
| 46 const int dstStrideX = dstDirection == kX ? 1 : height; | 41 const int dstStrideX = dstDirection == kX ? 1 : height; |
| 47 const int srcStrideY = srcDirection == kX ? srcStride : 1; | 42 const int srcStrideY = srcDirection == kX ? srcStride : 1; |
| (...skipping 60 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 108 bool SkBoxBlurGetPlatformProcs_SSE2(SkBoxBlurProc* boxBlurX, | 103 bool SkBoxBlurGetPlatformProcs_SSE2(SkBoxBlurProc* boxBlurX, |
| 109 SkBoxBlurProc* boxBlurY, | 104 SkBoxBlurProc* boxBlurY, |
| 110 SkBoxBlurProc* boxBlurXY, | 105 SkBoxBlurProc* boxBlurXY, |
| 111 SkBoxBlurProc* boxBlurYX) { | 106 SkBoxBlurProc* boxBlurYX) { |
| 112 *boxBlurX = SkBoxBlur_SSE2<kX, kX>; | 107 *boxBlurX = SkBoxBlur_SSE2<kX, kX>; |
| 113 *boxBlurY = SkBoxBlur_SSE2<kY, kY>; | 108 *boxBlurY = SkBoxBlur_SSE2<kY, kY>; |
| 114 *boxBlurXY = SkBoxBlur_SSE2<kX, kY>; | 109 *boxBlurXY = SkBoxBlur_SSE2<kX, kY>; |
| 115 *boxBlurYX = SkBoxBlur_SSE2<kY, kX>; | 110 *boxBlurYX = SkBoxBlur_SSE2<kY, kX>; |
| 116 return true; | 111 return true; |
| 117 } | 112 } |
| OLD | NEW |