| Index: source/libvpx/third_party/libyuv/source/compare_neon.cc
|
| diff --git a/source/libvpx/third_party/libyuv/source/compare_neon.cc b/source/libvpx/third_party/libyuv/source/compare_neon.cc
|
| index 55052c0eecb707aa7c2c5c8a3d7ae658a50ea739..ef006ec41cdc71cddfd3381bef19d8bc58ff874a 100644
|
| --- a/source/libvpx/third_party/libyuv/source/compare_neon.cc
|
| +++ b/source/libvpx/third_party/libyuv/source/compare_neon.cc
|
| @@ -16,7 +16,8 @@ namespace libyuv {
|
| extern "C" {
|
| #endif
|
|
|
| -#if !defined(LIBYUV_DISABLE_NEON) && defined(__ARM_NEON__)
|
| +#if !defined(LIBYUV_DISABLE_NEON) && defined(__ARM_NEON__) && \
|
| + !defined(__aarch64__)
|
|
|
| uint32 SumSquareError_NEON(const uint8* src_a, const uint8* src_b, int count) {
|
| volatile uint32 sse;
|
| @@ -56,46 +57,7 @@ uint32 SumSquareError_NEON(const uint8* src_a, const uint8* src_b, int count) {
|
| return sse;
|
| }
|
|
|
| -#elif !defined(LIBYUV_DISABLE_NEON) && defined(__aarch64__)
|
| -
|
| -uint32 SumSquareError_NEON(const uint8* src_a, const uint8* src_b, int count) {
|
| - volatile uint32 sse;
|
| - asm volatile (
|
| - "eor v16.16b, v16.16b, v16.16b \n"
|
| - "eor v18.16b, v18.16b, v18.16b \n"
|
| - "eor v17.16b, v17.16b, v17.16b \n"
|
| - "eor v19.16b, v19.16b, v19.16b \n"
|
| -
|
| - ".p2align 2 \n"
|
| - "1: \n"
|
| - MEMACCESS(0)
|
| - "ld1 {v0.16b}, [%0], #16 \n"
|
| - MEMACCESS(1)
|
| - "ld1 {v1.16b}, [%1], #16 \n"
|
| - "subs %2, %2, #16 \n"
|
| - "usubl v2.8h, v0.8b, v1.8b \n"
|
| - "usubl2 v3.8h, v0.16b, v1.16b \n"
|
| - "smlal v16.4s, v2.4h, v2.4h \n"
|
| - "smlal v17.4s, v3.4h, v3.4h \n"
|
| - "smlal2 v18.4s, v2.8h, v2.8h \n"
|
| - "smlal2 v19.4s, v3.8h, v3.8h \n"
|
| - "bgt 1b \n"
|
| -
|
| - "add v16.4s, v16.4s, v17.4s \n"
|
| - "add v18.4s, v18.4s, v19.4s \n"
|
| - "add v19.4s, v16.4s, v18.4s \n"
|
| - "addv s0, v19.4s \n"
|
| - "fmov %w3, s0 \n"
|
| - : "+r"(src_a),
|
| - "+r"(src_b),
|
| - "+r"(count),
|
| - "=r"(sse)
|
| - :
|
| - : "cc", "v0", "v1", "v2", "v3", "v16", "v17", "v18", "v19");
|
| - return sse;
|
| -}
|
| -
|
| -#endif // __ARM_NEON__
|
| +#endif // defined(__ARM_NEON__) && !defined(__aarch64__)
|
|
|
| #ifdef __cplusplus
|
| } // extern "C"
|
|
|