Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(93)

Side by Side Diff: source/row_any.cc

Issue 1513443002: Optimize BlendPlane SIMD support for odd width. (Closed) Base URL: https://chromium.googlesource.com/libyuv/libyuv@master
Patch Set: Created 5 years ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« source/planar_functions.cc ('K') | « source/planar_functions.cc ('k') | no next file » | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 /* 1 /*
2 * Copyright 2012 The LibYuv Project Authors. All rights reserved. 2 * Copyright 2012 The LibYuv Project Authors. All rights reserved.
3 * 3 *
4 * Use of this source code is governed by a BSD-style license 4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source 5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found 6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may 7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree. 8 * be found in the AUTHORS file in the root of the source tree.
9 */ 9 */
10 10
(...skipping 65 matching lines...) Expand 10 before | Expand all | Expand 10 after
76 #ifdef HAS_I422TOYUY2ROW_SSE2 76 #ifdef HAS_I422TOYUY2ROW_SSE2
77 ANY31(I422ToYUY2Row_Any_SSE2, I422ToYUY2Row_SSE2, 1, 1, 4, 15) 77 ANY31(I422ToYUY2Row_Any_SSE2, I422ToYUY2Row_SSE2, 1, 1, 4, 15)
78 ANY31(I422ToUYVYRow_Any_SSE2, I422ToUYVYRow_SSE2, 1, 1, 4, 15) 78 ANY31(I422ToUYVYRow_Any_SSE2, I422ToUYVYRow_SSE2, 1, 1, 4, 15)
79 #endif 79 #endif
80 #ifdef HAS_I422TOYUY2ROW_NEON 80 #ifdef HAS_I422TOYUY2ROW_NEON
81 ANY31(I422ToYUY2Row_Any_NEON, I422ToYUY2Row_NEON, 1, 1, 4, 15) 81 ANY31(I422ToYUY2Row_Any_NEON, I422ToYUY2Row_NEON, 1, 1, 4, 15)
82 #endif 82 #endif
83 #ifdef HAS_I422TOUYVYROW_NEON 83 #ifdef HAS_I422TOUYVYROW_NEON
84 ANY31(I422ToUYVYRow_Any_NEON, I422ToUYVYRow_NEON, 1, 1, 4, 15) 84 ANY31(I422ToUYVYRow_Any_NEON, I422ToUYVYRow_NEON, 1, 1, 4, 15)
85 #endif 85 #endif
86 #ifdef HAS_BLENDPLANEROW_AVX2
87 ANY31(BlendPlaneRow_Any_AVX2, BlendPlaneRow_AVX2, 0, 0, 1, 31)
88 #endif
89 #ifdef HAS_BLENDPLANEROW_SSSE3
90 ANY31(BlendPlaneRow_Any_SSSE3, BlendPlaneRow_SSSE3, 0, 0, 1, 7)
91 #endif
86 #undef ANY31 92 #undef ANY31
87 93
94 void BlendPlaneRow_Any_AVX2(const uint8* src0, const uint8* src1,
95 const uint8* alpha, uint8* dst, int width);
96
97
88 // Note that odd width replication includes 444 due to implementation 98 // Note that odd width replication includes 444 due to implementation
89 // on ARM that subsamples 444 to 422 internally. 99 // on ARM that subsamples 444 to 422 internally.
90 // Any 3 planes to 1 with yuvconstants 100 // Any 3 planes to 1 with yuvconstants
91 #define ANY31C(NAMEANY, ANY_SIMD, UVSHIFT, DUVSHIFT, BPP, MASK) \ 101 #define ANY31C(NAMEANY, ANY_SIMD, UVSHIFT, DUVSHIFT, BPP, MASK) \
92 void NAMEANY(const uint8* y_buf, const uint8* u_buf, const uint8* v_buf, \ 102 void NAMEANY(const uint8* y_buf, const uint8* u_buf, const uint8* v_buf, \
93 uint8* dst_ptr, const struct YuvConstants* yuvconstants, \ 103 uint8* dst_ptr, const struct YuvConstants* yuvconstants, \
94 int width) { \ 104 int width) { \
95 SIMD_ALIGNED(uint8 temp[64 * 4]); \ 105 SIMD_ALIGNED(uint8 temp[64 * 4]); \
96 memset(temp, 0, 64 * 3); /* for YUY2 and msan */ \ 106 memset(temp, 0, 64 * 3); /* for YUY2 and msan */ \
97 int r = width & MASK; \ 107 int r = width & MASK; \
(...skipping 709 matching lines...) Expand 10 before | Expand all | Expand 10 after
807 #endif 817 #endif
808 #ifdef HAS_UYVYTOUVROW_NEON 818 #ifdef HAS_UYVYTOUVROW_NEON
809 ANY12S(UYVYToUVRow_Any_NEON, UYVYToUVRow_NEON, 1, 4, 15) 819 ANY12S(UYVYToUVRow_Any_NEON, UYVYToUVRow_NEON, 1, 4, 15)
810 #endif 820 #endif
811 #undef ANY12S 821 #undef ANY12S
812 822
813 #ifdef __cplusplus 823 #ifdef __cplusplus
814 } // extern "C" 824 } // extern "C"
815 } // namespace libyuv 825 } // namespace libyuv
816 #endif 826 #endif
OLDNEW
« source/planar_functions.cc ('K') | « source/planar_functions.cc ('k') | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698