Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(38)

Side by Side Diff: source/row_neon64.cc

Issue 2035573002: ARGBExtractAlpha 16 pixels at a time for ARM (Closed) Base URL: https://chromium.googlesource.com/libyuv/libyuv@master
Patch Set: tested variations of 64 bit Created 4 years, 6 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« libyuv.gyp ('K') | « source/row_neon.cc ('k') | no next file » | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 /* 1 /*
2 * Copyright 2014 The LibYuv Project Authors. All rights reserved. 2 * Copyright 2014 The LibYuv Project Authors. All rights reserved.
3 * 3 *
4 * Use of this source code is governed by a BSD-style license 4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source 5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found 6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may 7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree. 8 * be found in the AUTHORS file in the root of the source tree.
9 */ 9 */
10 10
(...skipping 1386 matching lines...) Expand 10 before | Expand all | Expand 10 after
1397 : "cc", "memory", "v0", "v1", "v2", "v3", "v4", "v5", "v6", "v7" 1397 : "cc", "memory", "v0", "v1", "v2", "v3", "v4", "v5", "v6", "v7"
1398 ); 1398 );
1399 } 1399 }
1400 #endif // HAS_ARGBTOYROW_NEON 1400 #endif // HAS_ARGBTOYROW_NEON
1401 1401
1402 #ifdef HAS_ARGBEXTRACTALPHAROW_NEON 1402 #ifdef HAS_ARGBEXTRACTALPHAROW_NEON
1403 void ARGBExtractAlphaRow_NEON(const uint8* src_argb, uint8* dst_a, int width) { 1403 void ARGBExtractAlphaRow_NEON(const uint8* src_argb, uint8* dst_a, int width) {
1404 asm volatile ( 1404 asm volatile (
1405 "1: \n" 1405 "1: \n"
1406 MEMACCESS(0) 1406 MEMACCESS(0)
1407 "ld4 {v0.8b,v1.8b,v2.8b,v3.8b}, [%0], #32 \n" // load row 8 pixels 1407 "ld4 {v0.16b,v1.16b,v2.16b,v3.16b}, [%0], #64 \n" // load row 16 pix els
1408 "subs %w2, %w2, #8 \n" // 8 processed per loop 1408 "subs %w2, %w2, #16 \n" // 16 processed per loop
1409 MEMACCESS(1) 1409 MEMACCESS(1)
1410 "st1 {v3.8b}, [%1], #8 \n" // store 8 A's. 1410 "st1 {v3.16b}, [%1], #16 \n" // store 16 A's.
1411 "b.gt 1b \n" 1411 "b.gt 1b \n"
1412 : "+r"(src_argb), // %0 1412 : "+r"(src_argb), // %0
1413 "+r"(dst_a), // %1 1413 "+r"(dst_a), // %1
1414 "+r"(width) // %2 1414 "+r"(width) // %2
1415 : 1415 :
1416 : "cc", "memory", "v0", "v1", "v2", "v3" // Clobber List 1416 : "cc", "memory", "v0", "v1", "v2", "v3" // Clobber List
1417 ); 1417 );
1418 } 1418 }
1419 #endif // HAS_ARGBEXTRACTALPHAROW_NEON 1419 #endif // HAS_ARGBEXTRACTALPHAROW_NEON
1420 1420
(...skipping 1550 matching lines...) Expand 10 before | Expand all | Expand 10 after
2971 : "cc", "memory", "v0", "v1", "v2", "v3" // Clobber List 2971 : "cc", "memory", "v0", "v1", "v2", "v3" // Clobber List
2972 ); 2972 );
2973 } 2973 }
2974 #endif // HAS_SOBELYROW_NEON 2974 #endif // HAS_SOBELYROW_NEON
2975 #endif // !defined(LIBYUV_DISABLE_NEON) && defined(__aarch64__) 2975 #endif // !defined(LIBYUV_DISABLE_NEON) && defined(__aarch64__)
2976 2976
2977 #ifdef __cplusplus 2977 #ifdef __cplusplus
2978 } // extern "C" 2978 } // extern "C"
2979 } // namespace libyuv 2979 } // namespace libyuv
2980 #endif 2980 #endif
OLDNEW
« libyuv.gyp ('K') | « source/row_neon.cc ('k') | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698