OLD | NEW |
1 /* | 1 /* |
2 * Copyright 2012 The LibYuv Project Authors. All rights reserved. | 2 * Copyright 2012 The LibYuv Project Authors. All rights reserved. |
3 * | 3 * |
4 * Use of this source code is governed by a BSD-style license | 4 * Use of this source code is governed by a BSD-style license |
5 * that can be found in the LICENSE file in the root of the source | 5 * that can be found in the LICENSE file in the root of the source |
6 * tree. An additional intellectual property rights grant can be found | 6 * tree. An additional intellectual property rights grant can be found |
7 * in the file PATENTS. All contributing project authors may | 7 * in the file PATENTS. All contributing project authors may |
8 * be found in the AUTHORS file in the root of the source tree. | 8 * be found in the AUTHORS file in the root of the source tree. |
9 */ | 9 */ |
10 | 10 |
(...skipping 109 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
120 } \ | 120 } \ |
121 ANY_SIMD(temp, temp + 64, temp + 128, temp + 192, \ | 121 ANY_SIMD(temp, temp + 64, temp + 128, temp + 192, \ |
122 yuvconstants, MASK + 1); \ | 122 yuvconstants, MASK + 1); \ |
123 memcpy(dst_ptr + (n >> DUVSHIFT) * BPP, temp + 192, \ | 123 memcpy(dst_ptr + (n >> DUVSHIFT) * BPP, temp + 192, \ |
124 SS(r, DUVSHIFT) * BPP); \ | 124 SS(r, DUVSHIFT) * BPP); \ |
125 } | 125 } |
126 | 126 |
127 #ifdef HAS_I422TOARGBROW_SSSE3 | 127 #ifdef HAS_I422TOARGBROW_SSSE3 |
128 ANY31C(I422ToARGBRow_Any_SSSE3, I422ToARGBRow_SSSE3, 1, 0, 4, 7) | 128 ANY31C(I422ToARGBRow_Any_SSSE3, I422ToARGBRow_SSSE3, 1, 0, 4, 7) |
129 #endif | 129 #endif |
130 #ifdef HAS_I411TOARGBROW_SSSE3 | |
131 ANY31C(I411ToARGBRow_Any_SSSE3, I411ToARGBRow_SSSE3, 2, 0, 4, 7) | |
132 #endif | |
133 #ifdef HAS_I444TOARGBROW_SSSE3 | 130 #ifdef HAS_I444TOARGBROW_SSSE3 |
134 ANY31C(I444ToARGBRow_Any_SSSE3, I444ToARGBRow_SSSE3, 0, 0, 4, 7) | 131 ANY31C(I444ToARGBRow_Any_SSSE3, I444ToARGBRow_SSSE3, 0, 0, 4, 7) |
135 ANY31C(I422ToRGBARow_Any_SSSE3, I422ToRGBARow_SSSE3, 1, 0, 4, 7) | 132 ANY31C(I422ToRGBARow_Any_SSSE3, I422ToRGBARow_SSSE3, 1, 0, 4, 7) |
136 ANY31C(I422ToARGB4444Row_Any_SSSE3, I422ToARGB4444Row_SSSE3, 1, 0, 2, 7) | 133 ANY31C(I422ToARGB4444Row_Any_SSSE3, I422ToARGB4444Row_SSSE3, 1, 0, 2, 7) |
137 ANY31C(I422ToARGB1555Row_Any_SSSE3, I422ToARGB1555Row_SSSE3, 1, 0, 2, 7) | 134 ANY31C(I422ToARGB1555Row_Any_SSSE3, I422ToARGB1555Row_SSSE3, 1, 0, 2, 7) |
138 ANY31C(I422ToRGB565Row_Any_SSSE3, I422ToRGB565Row_SSSE3, 1, 0, 2, 7) | 135 ANY31C(I422ToRGB565Row_Any_SSSE3, I422ToRGB565Row_SSSE3, 1, 0, 2, 7) |
139 ANY31C(I422ToRGB24Row_Any_SSSE3, I422ToRGB24Row_SSSE3, 1, 0, 3, 7) | 136 ANY31C(I422ToRGB24Row_Any_SSSE3, I422ToRGB24Row_SSSE3, 1, 0, 3, 7) |
140 #endif // HAS_I444TOARGBROW_SSSE3 | 137 #endif // HAS_I444TOARGBROW_SSSE3 |
141 #ifdef HAS_I422TORGB24ROW_AVX2 | 138 #ifdef HAS_I422TORGB24ROW_AVX2 |
142 ANY31C(I422ToRGB24Row_Any_AVX2, I422ToRGB24Row_AVX2, 1, 0, 3, 15) | 139 ANY31C(I422ToRGB24Row_Any_AVX2, I422ToRGB24Row_AVX2, 1, 0, 3, 15) |
143 #endif | 140 #endif |
144 #ifdef HAS_I422TOARGBROW_AVX2 | 141 #ifdef HAS_I422TOARGBROW_AVX2 |
145 ANY31C(I422ToARGBRow_Any_AVX2, I422ToARGBRow_AVX2, 1, 0, 4, 15) | 142 ANY31C(I422ToARGBRow_Any_AVX2, I422ToARGBRow_AVX2, 1, 0, 4, 15) |
146 #endif | 143 #endif |
147 #ifdef HAS_I422TORGBAROW_AVX2 | 144 #ifdef HAS_I422TORGBAROW_AVX2 |
148 ANY31C(I422ToRGBARow_Any_AVX2, I422ToRGBARow_AVX2, 1, 0, 4, 15) | 145 ANY31C(I422ToRGBARow_Any_AVX2, I422ToRGBARow_AVX2, 1, 0, 4, 15) |
149 #endif | 146 #endif |
150 #ifdef HAS_I444TOARGBROW_AVX2 | 147 #ifdef HAS_I444TOARGBROW_AVX2 |
151 ANY31C(I444ToARGBRow_Any_AVX2, I444ToARGBRow_AVX2, 0, 0, 4, 15) | 148 ANY31C(I444ToARGBRow_Any_AVX2, I444ToARGBRow_AVX2, 0, 0, 4, 15) |
152 #endif | 149 #endif |
153 #ifdef HAS_I411TOARGBROW_AVX2 | |
154 ANY31C(I411ToARGBRow_Any_AVX2, I411ToARGBRow_AVX2, 2, 0, 4, 15) | |
155 #endif | |
156 #ifdef HAS_I422TOARGB4444ROW_AVX2 | 150 #ifdef HAS_I422TOARGB4444ROW_AVX2 |
157 ANY31C(I422ToARGB4444Row_Any_AVX2, I422ToARGB4444Row_AVX2, 1, 0, 2, 7) | 151 ANY31C(I422ToARGB4444Row_Any_AVX2, I422ToARGB4444Row_AVX2, 1, 0, 2, 7) |
158 #endif | 152 #endif |
159 #ifdef HAS_I422TOARGB1555ROW_AVX2 | 153 #ifdef HAS_I422TOARGB1555ROW_AVX2 |
160 ANY31C(I422ToARGB1555Row_Any_AVX2, I422ToARGB1555Row_AVX2, 1, 0, 2, 7) | 154 ANY31C(I422ToARGB1555Row_Any_AVX2, I422ToARGB1555Row_AVX2, 1, 0, 2, 7) |
161 #endif | 155 #endif |
162 #ifdef HAS_I422TORGB565ROW_AVX2 | 156 #ifdef HAS_I422TORGB565ROW_AVX2 |
163 ANY31C(I422ToRGB565Row_Any_AVX2, I422ToRGB565Row_AVX2, 1, 0, 2, 7) | 157 ANY31C(I422ToRGB565Row_Any_AVX2, I422ToRGB565Row_AVX2, 1, 0, 2, 7) |
164 #endif | 158 #endif |
165 #ifdef HAS_I422TOARGBROW_NEON | 159 #ifdef HAS_I422TOARGBROW_NEON |
166 ANY31C(I444ToARGBRow_Any_NEON, I444ToARGBRow_NEON, 0, 0, 4, 7) | 160 ANY31C(I444ToARGBRow_Any_NEON, I444ToARGBRow_NEON, 0, 0, 4, 7) |
167 ANY31C(I422ToARGBRow_Any_NEON, I422ToARGBRow_NEON, 1, 0, 4, 7) | 161 ANY31C(I422ToARGBRow_Any_NEON, I422ToARGBRow_NEON, 1, 0, 4, 7) |
168 ANY31C(I411ToARGBRow_Any_NEON, I411ToARGBRow_NEON, 2, 0, 4, 7) | |
169 ANY31C(I422ToRGBARow_Any_NEON, I422ToRGBARow_NEON, 1, 0, 4, 7) | 162 ANY31C(I422ToRGBARow_Any_NEON, I422ToRGBARow_NEON, 1, 0, 4, 7) |
170 ANY31C(I422ToRGB24Row_Any_NEON, I422ToRGB24Row_NEON, 1, 0, 3, 7) | 163 ANY31C(I422ToRGB24Row_Any_NEON, I422ToRGB24Row_NEON, 1, 0, 3, 7) |
171 ANY31C(I422ToARGB4444Row_Any_NEON, I422ToARGB4444Row_NEON, 1, 0, 2, 7) | 164 ANY31C(I422ToARGB4444Row_Any_NEON, I422ToARGB4444Row_NEON, 1, 0, 2, 7) |
172 ANY31C(I422ToARGB1555Row_Any_NEON, I422ToARGB1555Row_NEON, 1, 0, 2, 7) | 165 ANY31C(I422ToARGB1555Row_Any_NEON, I422ToARGB1555Row_NEON, 1, 0, 2, 7) |
173 ANY31C(I422ToRGB565Row_Any_NEON, I422ToRGB565Row_NEON, 1, 0, 2, 7) | 166 ANY31C(I422ToRGB565Row_Any_NEON, I422ToRGB565Row_NEON, 1, 0, 2, 7) |
174 #endif | 167 #endif |
175 #undef ANY31C | 168 #undef ANY31C |
176 | 169 |
177 // Any 2 planes to 1. | 170 // Any 2 planes to 1. |
178 #define ANY21(NAMEANY, ANY_SIMD, UVSHIFT, SBPP, SBPP2, BPP, MASK) \ | 171 #define ANY21(NAMEANY, ANY_SIMD, UVSHIFT, SBPP, SBPP2, BPP, MASK) \ |
(...skipping 534 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
713 #define ANY12(NAMEANY, ANY_SIMD, UVSHIFT, BPP, DUVSHIFT, MASK) \ | 706 #define ANY12(NAMEANY, ANY_SIMD, UVSHIFT, BPP, DUVSHIFT, MASK) \ |
714 void NAMEANY(const uint8* src_ptr, uint8* dst_u, uint8* dst_v, int width) {\ | 707 void NAMEANY(const uint8* src_ptr, uint8* dst_u, uint8* dst_v, int width) {\ |
715 SIMD_ALIGNED(uint8 temp[128 * 3]); \ | 708 SIMD_ALIGNED(uint8 temp[128 * 3]); \ |
716 memset(temp, 0, 128); /* for msan */ \ | 709 memset(temp, 0, 128); /* for msan */ \ |
717 int r = width & MASK; \ | 710 int r = width & MASK; \ |
718 int n = width & ~MASK; \ | 711 int n = width & ~MASK; \ |
719 if (n > 0) { \ | 712 if (n > 0) { \ |
720 ANY_SIMD(src_ptr, dst_u, dst_v, n); \ | 713 ANY_SIMD(src_ptr, dst_u, dst_v, n); \ |
721 } \ | 714 } \ |
722 memcpy(temp, src_ptr + (n >> UVSHIFT) * BPP, SS(r, UVSHIFT) * BPP); \ | 715 memcpy(temp, src_ptr + (n >> UVSHIFT) * BPP, SS(r, UVSHIFT) * BPP); \ |
723 /* repeat last 4 - 12 bytes for 411 subsampler */ \ | |
724 if (((width & 3) == 1) && BPP == 4 && DUVSHIFT == 2) { \ | |
725 memcpy(temp + SS(r, UVSHIFT) * BPP, \ | |
726 temp + SS(r, UVSHIFT) * BPP - BPP, BPP); \ | |
727 memcpy(temp + SS(r, UVSHIFT) * BPP + BPP, \ | |
728 temp + SS(r, UVSHIFT) * BPP - BPP, BPP * 2); \ | |
729 } \ | |
730 if (((width & 3) == 2) && BPP == 4 && DUVSHIFT == 2) { \ | |
731 memcpy(temp + SS(r, UVSHIFT) * BPP, \ | |
732 temp + SS(r, UVSHIFT) * BPP - BPP * 2, BPP * 2); \ | |
733 } \ | |
734 if (((width & 3) == 3) && BPP == 4 && DUVSHIFT == 2) { \ | |
735 memcpy(temp + SS(r, UVSHIFT) * BPP, \ | |
736 temp + SS(r, UVSHIFT) * BPP - BPP, BPP); \ | |
737 } \ | |
738 ANY_SIMD(temp, temp + 128, temp + 256, MASK + 1); \ | 716 ANY_SIMD(temp, temp + 128, temp + 256, MASK + 1); \ |
739 memcpy(dst_u + (n >> DUVSHIFT), temp + 128, SS(r, DUVSHIFT)); \ | 717 memcpy(dst_u + (n >> DUVSHIFT), temp + 128, SS(r, DUVSHIFT)); \ |
740 memcpy(dst_v + (n >> DUVSHIFT), temp + 256, SS(r, DUVSHIFT)); \ | 718 memcpy(dst_v + (n >> DUVSHIFT), temp + 256, SS(r, DUVSHIFT)); \ |
741 } | 719 } |
742 | 720 |
743 #ifdef HAS_SPLITUVROW_SSE2 | 721 #ifdef HAS_SPLITUVROW_SSE2 |
744 ANY12(SplitUVRow_Any_SSE2, SplitUVRow_SSE2, 0, 2, 0, 15) | 722 ANY12(SplitUVRow_Any_SSE2, SplitUVRow_SSE2, 0, 2, 0, 15) |
745 #endif | 723 #endif |
746 #ifdef HAS_SPLITUVROW_AVX2 | 724 #ifdef HAS_SPLITUVROW_AVX2 |
747 ANY12(SplitUVRow_Any_AVX2, SplitUVRow_AVX2, 0, 2, 0, 31) | 725 ANY12(SplitUVRow_Any_AVX2, SplitUVRow_AVX2, 0, 2, 0, 31) |
(...skipping 10 matching lines...) Expand all Loading... |
758 #ifdef HAS_YUY2TOUV422ROW_AVX2 | 736 #ifdef HAS_YUY2TOUV422ROW_AVX2 |
759 ANY12(YUY2ToUV422Row_Any_AVX2, YUY2ToUV422Row_AVX2, 1, 4, 1, 31) | 737 ANY12(YUY2ToUV422Row_Any_AVX2, YUY2ToUV422Row_AVX2, 1, 4, 1, 31) |
760 ANY12(UYVYToUV422Row_Any_AVX2, UYVYToUV422Row_AVX2, 1, 4, 1, 31) | 738 ANY12(UYVYToUV422Row_Any_AVX2, UYVYToUV422Row_AVX2, 1, 4, 1, 31) |
761 #endif | 739 #endif |
762 #ifdef HAS_YUY2TOUV422ROW_SSE2 | 740 #ifdef HAS_YUY2TOUV422ROW_SSE2 |
763 ANY12(YUY2ToUV422Row_Any_SSE2, YUY2ToUV422Row_SSE2, 1, 4, 1, 15) | 741 ANY12(YUY2ToUV422Row_Any_SSE2, YUY2ToUV422Row_SSE2, 1, 4, 1, 15) |
764 ANY12(UYVYToUV422Row_Any_SSE2, UYVYToUV422Row_SSE2, 1, 4, 1, 15) | 742 ANY12(UYVYToUV422Row_Any_SSE2, UYVYToUV422Row_SSE2, 1, 4, 1, 15) |
765 #endif | 743 #endif |
766 #ifdef HAS_YUY2TOUV422ROW_NEON | 744 #ifdef HAS_YUY2TOUV422ROW_NEON |
767 ANY12(ARGBToUV444Row_Any_NEON, ARGBToUV444Row_NEON, 0, 4, 0, 7) | 745 ANY12(ARGBToUV444Row_Any_NEON, ARGBToUV444Row_NEON, 0, 4, 0, 7) |
768 ANY12(ARGBToUV411Row_Any_NEON, ARGBToUV411Row_NEON, 0, 4, 2, 31) | |
769 ANY12(YUY2ToUV422Row_Any_NEON, YUY2ToUV422Row_NEON, 1, 4, 1, 15) | 746 ANY12(YUY2ToUV422Row_Any_NEON, YUY2ToUV422Row_NEON, 1, 4, 1, 15) |
770 ANY12(UYVYToUV422Row_Any_NEON, UYVYToUV422Row_NEON, 1, 4, 1, 15) | 747 ANY12(UYVYToUV422Row_Any_NEON, UYVYToUV422Row_NEON, 1, 4, 1, 15) |
771 #endif | 748 #endif |
772 #ifdef HAS_YUY2TOUV422ROW_MSA | 749 #ifdef HAS_YUY2TOUV422ROW_MSA |
773 ANY12(YUY2ToUV422Row_Any_MSA, YUY2ToUV422Row_MSA, 1, 4, 1, 31) | 750 ANY12(YUY2ToUV422Row_Any_MSA, YUY2ToUV422Row_MSA, 1, 4, 1, 31) |
774 ANY12(UYVYToUV422Row_Any_MSA, UYVYToUV422Row_MSA, 1, 4, 1, 31) | 751 ANY12(UYVYToUV422Row_Any_MSA, UYVYToUV422Row_MSA, 1, 4, 1, 31) |
775 #endif | 752 #endif |
776 #undef ANY12 | 753 #undef ANY12 |
777 | 754 |
778 // Any 1 to 2 with source stride (2 rows of source). Outputs UV planes. | 755 // Any 1 to 2 with source stride (2 rows of source). Outputs UV planes. |
(...skipping 84 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
863 #endif | 840 #endif |
864 #ifdef HAS_UYVYTOUVROW_MSA | 841 #ifdef HAS_UYVYTOUVROW_MSA |
865 ANY12S(UYVYToUVRow_Any_MSA, UYVYToUVRow_MSA, 1, 4, 31) | 842 ANY12S(UYVYToUVRow_Any_MSA, UYVYToUVRow_MSA, 1, 4, 31) |
866 #endif | 843 #endif |
867 #undef ANY12S | 844 #undef ANY12S |
868 | 845 |
869 #ifdef __cplusplus | 846 #ifdef __cplusplus |
870 } // extern "C" | 847 } // extern "C" |
871 } // namespace libyuv | 848 } // namespace libyuv |
872 #endif | 849 #endif |
OLD | NEW |