| OLD | NEW |
| (Empty) |
| 1 ; | |
| 2 ; Copyright (c) 2010 The WebM project authors. All Rights Reserved. | |
| 3 ; | |
| 4 ; Use of this source code is governed by a BSD-style license | |
| 5 ; that can be found in the LICENSE file in the root of the source | |
| 6 ; tree. An additional intellectual property rights grant can be found | |
| 7 ; in the file PATENTS. All contributing project authors may | |
| 8 ; be found in the AUTHORS file in the root of the source tree. | |
| 9 ; | |
| 10 | |
| 11 | |
| 12 EXPORT |vp8_memcpy_partial_neon| | |
| 13 | |
| 14 ARM | |
| 15 REQUIRE8 | |
| 16 PRESERVE8 | |
| 17 | |
| 18 AREA ||.text||, CODE, READONLY, ALIGN=2 | |
;=========================================
; void vp8_memcpy_partial_neon(unsigned char *dst_ptr, unsigned char *src_ptr,
;                              int sz);
;
; Forward byte copy of sz bytes from src_ptr to dst_ptr using NEON.
;
; Still not a drop-in replacement for memcpy(): nothing is returned, and the
; copy always runs from low to high addresses with no special handling of
; overlapping buffers.
;
; The copy is done in three stages so that any sz is handled safely:
;   1. sz / 256         blocks of 256 bytes   (q0-q15, fully unrolled)
;   2. (sz % 256) / 16  chunks of 16 bytes    (q0)
;   3. sz % 16          single bytes          (ldrb/strb)
; sz <= 0 copies nothing.
;
; In:       r0 = dst_ptr, r1 = src_ptr, r2 = sz
; Out:      none (on return r0/r1 have been advanced past the copied data)
; Clobbers: r0, r1, r3, r12, q0-q3, q8-q15, flags
; Saved:    d8-d15 (= q4-q7) are pushed on entry and restored on exit
;=========================================
|vp8_memcpy_partial_neon| PROC
    cmp             r2, #0
    bxle            lr                      ; nothing to copy; stack not touched yet

    vpush           {d8-d15}                ; q4-q7 are used below as copy registers

    ;pld            [r1]                    ;preload pred data
    ;pld            [r1, #128]
    ;pld            [r1, #256]
    ;pld            [r1, #384]

    movs            r12, r2, lsr #8         ; r12 = number of 256-byte blocks
    beq             copy_16_byte_chunks     ; sz < 256: entering the loop with a
                                            ; zero count would wrap the counter

memcpy_neon_loop
    ; Loads and stores are interleaved; each store writes the register pair
    ; loaded one step earlier.
    vld1.8          {q0, q1}, [r1]!         ; load src data
    subs            r12, r12, #1            ; flags consumed by the bne below
                                            ; (NEON load/store leave them alone)
    vld1.8          {q2, q3}, [r1]!
    vst1.8          {q0, q1}, [r0]!         ; copy to dst_ptr
    vld1.8          {q4, q5}, [r1]!
    vst1.8          {q2, q3}, [r0]!
    vld1.8          {q6, q7}, [r1]!
    vst1.8          {q4, q5}, [r0]!
    vld1.8          {q8, q9}, [r1]!
    vst1.8          {q6, q7}, [r0]!
    vld1.8          {q10, q11}, [r1]!
    vst1.8          {q8, q9}, [r0]!
    vld1.8          {q12, q13}, [r1]!
    vst1.8          {q10, q11}, [r0]!
    vld1.8          {q14, q15}, [r1]!
    vst1.8          {q12, q13}, [r0]!
    vst1.8          {q14, q15}, [r0]!

    ;pld            [r1]                    ;preload pred data -- need to adjust for real device
    ;pld            [r1, #128]
    ;pld            [r1, #256]
    ;pld            [r1, #384]

    bne             memcpy_neon_loop

copy_16_byte_chunks
    and             r3, r2, #0xff           ; r3 = bytes left after the 256-byte blocks
    movs            r12, r3, lsr #4         ; r12 = number of whole 16-byte chunks
    beq             copy_tail_bytes

extra_copy_neon_loop
    vld1.8          {q0}, [r1]!             ; load src data
    subs            r12, r12, #1            ; count chunks, not bytes, so a size that
                                            ; is not a multiple of 16 still terminates
    vst1.8          {q0}, [r0]!
    bne             extra_copy_neon_loop

copy_tail_bytes
    ands            r3, r3, #0x0f           ; r3 = final 0..15 bytes
    beq             done_copy_neon_loop

extra_copy_byte_loop
    ldrb            r12, [r1], #1
    subs            r3, r3, #1
    strb            r12, [r0], #1
    bne             extra_copy_byte_loop

done_copy_neon_loop
    vpop            {d8-d15}
    bx              lr
    ENDP
| 71 | |
| 72 END | |
| OLD | NEW |