OLD | NEW |
---|---|
1 /* | 1 /* |
2 * Copyright 2012 The Android Open Source Project | 2 * Copyright 2012 The Android Open Source Project |
3 * | 3 * |
4 * Use of this source code is governed by a BSD-style license that can be | 4 * Use of this source code is governed by a BSD-style license that can be |
5 * found in the LICENSE file. | 5 * found in the LICENSE file. |
6 */ | 6 */ |
7 | 7 |
8 #include "SkBitmapProcState_opts_SSSE3.h" | 8 #include "SkBitmapProcState_opts_SSSE3.h" |
9 #include "SkColorPriv.h" | |
9 #include "SkPaint.h" | 10 #include "SkPaint.h" |
10 #include "SkUtils.h" | 11 #include "SkUtils.h" |
11 | 12 |
12 /* With the exception of the compilers that don't support it, we always build the | 13 /* With the exception of the compilers that don't support it, we always build the |
13 * SSSE3 functions and enable the caller to determine SSSE3 support. However for | 14 * SSSE3 functions and enable the caller to determine SSSE3 support. However for |
14 * compilers that do not support SSSE3 we provide a stub implementation. | 15 * compilers that do not support SSSE3 we provide a stub implementation. |
15 */ | 16 */ |
16 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3 | 17 #if SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3 |
17 | 18 |
18 #include <tmmintrin.h> // SSSE3 | 19 #include <tmmintrin.h> // SSSE3 |
(...skipping 694 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
713 S32_generic_D32_filter_DX_SSSE3<false>(s, xy, count, colors); | 714 S32_generic_D32_filter_DX_SSSE3<false>(s, xy, count, colors); |
714 } | 715 } |
715 | 716 |
716 void S32_alpha_D32_filter_DX_SSSE3(const SkBitmapProcState& s, | 717 void S32_alpha_D32_filter_DX_SSSE3(const SkBitmapProcState& s, |
717 const uint32_t* xy, | 718 const uint32_t* xy, |
718 int count, uint32_t* colors) { | 719 int count, uint32_t* colors) { |
719 S32_generic_D32_filter_DX_SSSE3<true>(s, xy, count, colors); | 720 S32_generic_D32_filter_DX_SSSE3<true>(s, xy, count, colors); |
720 } | 721 } |
721 | 722 |
722 void S32_opaque_D32_filter_DXDY_SSSE3(const SkBitmapProcState& s, | 723 void S32_opaque_D32_filter_DXDY_SSSE3(const SkBitmapProcState& s, |
723 const uint32_t* xy, | 724 const uint32_t* xy, |
724 int count, uint32_t* colors) { | 725 int count, uint32_t* colors) { |
725 S32_generic_D32_filter_DXDY_SSSE3<false>(s, xy, count, colors); | 726 S32_generic_D32_filter_DXDY_SSSE3<false>(s, xy, count, colors); |
726 } | 727 } |
727 | 728 |
728 void S32_alpha_D32_filter_DXDY_SSSE3(const SkBitmapProcState& s, | 729 void S32_alpha_D32_filter_DXDY_SSSE3(const SkBitmapProcState& s, |
729 const uint32_t* xy, | 730 const uint32_t* xy, |
730 int count, uint32_t* colors) { | 731 int count, uint32_t* colors) { |
731 S32_generic_D32_filter_DXDY_SSSE3<true>(s, xy, count, colors); | 732 S32_generic_D32_filter_DXDY_SSSE3<true>(s, xy, count, colors); |
732 } | 733 } |
733 | 734 |
// Writes `count` 16-bit values to `colors`: runs the 32-bit DXDY filter (template argument | |
// `false`) into a temporary buffer of `count` uint32_t entries, then converts each entry | |
// with SkPixel32ToPixel16. | |
735 void S32_D16_filter_DXDY_SSSE3(const SkBitmapProcState& s, | |
736 const uint32_t* xy, | |
737 int count, uint16_t* colors) { | |
// Temporary 32-bit buffer sized to `count`. | |
// NOTE(review): the thread below suggests SkAutoSTMalloc<64, uint32_t> here (heap vs. stack). | |
738 SkAutoTMalloc<uint32_t> colors32(count); | |
qiankun
2014/12/02 10:51:41
If "uint32_t colors32[128];" used here, it's more
mtklein
2014/12/02 15:19:05
Might be worth trying SkAutoSTMalloc<64, uint32_t>
qiankun1
2014/12/02 15:58:43
Done. Where is these performance improvement from?
mtklein
2014/12/02 16:52:22
Right, just heap vs. stack. There's no difference
| |
// Fill the temporary buffer with 32-bit results for all `count` entries. | |
739 S32_generic_D32_filter_DXDY_SSSE3<false>(s, xy, count, colors32); | |
// Convert each 32-bit result to 16 bits and store it in the caller's output. | |
740 for(int i = 0; i < count; i++) { | |
741 *colors++ = SkPixel32ToPixel16(colors32[i]); | |
742 } | |
743 } | |
744 | |
734 #else // SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3 | 745 #else // SK_CPU_SSE_LEVEL >= SK_CPU_SSE_LEVEL_SSSE3 |
735 | 746 |
736 void S32_opaque_D32_filter_DX_SSSE3(const SkBitmapProcState& s, | 747 void S32_opaque_D32_filter_DX_SSSE3(const SkBitmapProcState& s, |
737 const uint32_t* xy, | 748 const uint32_t* xy, |
738 int count, uint32_t* colors) { | 749 int count, uint32_t* colors) { |
739 sk_throw(); | 750 sk_throw(); |
740 } | 751 } |
741 | 752 |
742 void S32_alpha_D32_filter_DX_SSSE3(const SkBitmapProcState& s, | 753 void S32_alpha_D32_filter_DX_SSSE3(const SkBitmapProcState& s, |
743 const uint32_t* xy, | 754 const uint32_t* xy, |
744 int count, uint32_t* colors) { | 755 int count, uint32_t* colors) { |
745 sk_throw(); | 756 sk_throw(); |
746 } | 757 } |
747 | 758 |
748 void S32_opaque_D32_filter_DXDY_SSSE3(const SkBitmapProcState& s, | 759 void S32_opaque_D32_filter_DXDY_SSSE3(const SkBitmapProcState& s, |
749 const uint32_t* xy, | 760 const uint32_t* xy, |
750 int count, uint32_t* colors) { | 761 int count, uint32_t* colors) { |
751 sk_throw(); | 762 sk_throw(); |
752 } | 763 } |
753 | 764 |
754 void S32_alpha_D32_filter_DXDY_SSSE3(const SkBitmapProcState& s, | 765 void S32_alpha_D32_filter_DXDY_SSSE3(const SkBitmapProcState& s, |
755 const uint32_t* xy, | 766 const uint32_t* xy, |
756 int count, uint32_t* colors) { | 767 int count, uint32_t* colors) { |
757 sk_throw(); | 768 sk_throw(); |
758 } | 769 } |
759 | 770 |
// Stub used when the compiler does not support SSSE3; calls sk_throw(). | |
// The parameter list matches the SSSE3 definition above (uint16_t* colors) so that both | |
// branches of the #if define the same function rather than two different overloads. | |
771 void S32_D16_filter_DXDY_SSSE3(const SkBitmapProcState& s, | |
772 const uint32_t* xy, | |
773 int count, uint16_t* colors) { | |
774 sk_throw(); | |
775 } | |
776 | |
760 #endif | 777 #endif |
OLD | NEW |