| Index: source/libvpx/vp8/encoder/arm/armv6/vp8_sad16x16_armv6.asm
|
| ===================================================================
|
| --- source/libvpx/vp8/encoder/arm/armv6/vp8_sad16x16_armv6.asm (revision 96967)
|
| +++ source/libvpx/vp8/encoder/arm/armv6/vp8_sad16x16_armv6.asm (working copy)
|
| @@ -24,6 +24,12 @@
|
| ; stack max_sad (not used)
|
| |vp8_sad16x16_armv6| PROC
|
| stmfd sp!, {r4-r12, lr}
|
| +
|
| + pld [r0, r1, lsl #0]
|
| + pld [r2, r3, lsl #0]
|
| + pld [r0, r1, lsl #1]
|
| + pld [r2, r3, lsl #1]
|
| +
|
| mov r4, #0 ; sad = 0;
|
| mov r5, #8 ; loop count
|
|
|
| @@ -45,6 +51,9 @@
|
| add r0, r0, r1 ; set src pointer to next row
|
| add r2, r2, r3 ; set dst pointer to next row
|
|
|
| + pld [r0, r1, lsl #1]
|
| + pld [r2, r3, lsl #1]
|
| +
|
| usada8 r4, r10, r12, r4 ; calculate sad for 4 pixels
|
| usada8 r8, r11, lr, r8 ; calculate sad for 4 pixels
|
|
|
| @@ -70,6 +79,9 @@
|
| usada8 r4, r10, r12, r4 ; calculate sad for 4 pixels
|
| usada8 r8, r11, lr, r8 ; calculate sad for 4 pixels
|
|
|
| + pld [r0, r1, lsl #1]
|
| + pld [r2, r3, lsl #1]
|
| +
|
| subs r5, r5, #1 ; decrement loop counter
|
| add r4, r4, r8 ; add partial sad values
|
|
|
|
|