OLD | NEW |
1 /* | 1 /* |
2 * Copyright 2011 The LibYuv Project Authors. All rights reserved. | 2 * Copyright 2011 The LibYuv Project Authors. All rights reserved. |
3 * | 3 * |
4 * Use of this source code is governed by a BSD-style license | 4 * Use of this source code is governed by a BSD-style license |
5 * that can be found in the LICENSE file in the root of the source | 5 * that can be found in the LICENSE file in the root of the source |
6 * tree. An additional intellectual property rights grant can be found | 6 * tree. An additional intellectual property rights grant can be found |
7 * in the file PATENTS. All contributing project authors may | 7 * in the file PATENTS. All contributing project authors may |
8 * be found in the AUTHORS file in the root of the source tree. | 8 * be found in the AUTHORS file in the root of the source tree. |
9 */ | 9 */ |
10 | 10 |
(...skipping 594 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
605 "vmov q11, q2 \n" | 605 "vmov q11, q2 \n" |
606 "vuzp.16 q10, q11 \n" | 606 "vuzp.16 q10, q11 \n" |
607 "vmovl.u8 q8, d6 \n" | 607 "vmovl.u8 q8, d6 \n" |
608 "vmovl.u8 q9, d7 \n" | 608 "vmovl.u8 q9, d7 \n" |
609 "vsubl.s16 q11, d18, d16 \n" | 609 "vsubl.s16 q11, d18, d16 \n" |
610 "vsubl.s16 q12, d19, d17 \n" | 610 "vsubl.s16 q12, d19, d17 \n" |
611 "vmovl.u16 q13, d20 \n" | 611 "vmovl.u16 q13, d20 \n" |
612 "vmovl.u16 q10, d21 \n" | 612 "vmovl.u16 q10, d21 \n" |
613 "vmul.s32 q11, q11, q13 \n" | 613 "vmul.s32 q11, q11, q13 \n" |
614 "vmul.s32 q12, q12, q10 \n" | 614 "vmul.s32 q12, q12, q10 \n" |
615 "vshrn.s32 d18, q11, #16 \n" | 615 "vrshrn.s32 d18, q11, #16 \n" |
616 "vshrn.s32 d19, q12, #16 \n" | 616 "vrshrn.s32 d19, q12, #16 \n" |
617 "vadd.s16 q8, q8, q9 \n" | 617 "vadd.s16 q8, q8, q9 \n" |
618 "vmovn.s16 d6, q8 \n" | 618 "vmovn.s16 d6, q8 \n" |
619 | 619 |
620 MEMACCESS(0) | 620 MEMACCESS(0) |
621 "vst1.8 {d6}, [%0]! \n" // store pixels | 621 "vst1.8 {d6}, [%0]! \n" // store pixels |
622 "vadd.s32 q1, q1, q0 \n" | 622 "vadd.s32 q1, q1, q0 \n" |
623 "vadd.s32 q2, q2, q0 \n" | 623 "vadd.s32 q2, q2, q0 \n" |
624 "subs %2, %2, #8 \n" // 8 processed per loop | 624 "subs %2, %2, #8 \n" // 8 processed per loop |
625 "bgt 1b \n" | 625 "bgt 1b \n" |
626 : "+r"(dst_ptr), // %0 | 626 : "+r"(dst_ptr), // %0 |
(...skipping 385 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1012 } | 1012 } |
1013 | 1013 |
1014 #undef LOAD2_DATA32_LANE | 1014 #undef LOAD2_DATA32_LANE |
1015 | 1015 |
1016 #endif // defined(__ARM_NEON__) && !defined(__aarch64__) | 1016 #endif // defined(__ARM_NEON__) && !defined(__aarch64__) |
1017 | 1017 |
1018 #ifdef __cplusplus | 1018 #ifdef __cplusplus |
1019 } // extern "C" | 1019 } // extern "C" |
1020 } // namespace libyuv | 1020 } // namespace libyuv |
1021 #endif | 1021 #endif |
OLD | NEW |