libvpx/source/libvpx/vp8/encoder/arm/neon/vp8_mse16x16_neon.asm - Issue 7624054: Revert r97185 "Update libvpx snapshot to v0.9.7-p1 (Cayuga)."

Keyboard Shortcuts

	File
u :	up to issue
j / k :	jump to file after / before current file
J / K :	jump to next file with a comment after / before current file
	Side-by-side diff
i :	toggle intra-line diffs
e :	expand all comments
c :	collapse all comments
s :	toggle showing all comments
n / p :	next / previous diff chunk or comment
N / P :	next / previous comment
<Up> / <Down> :	next / previous line

	Issue
u :	up to list of issues
j / k :	jump to patch after / before current patch
o / <Enter> :	open current patch in side-by-side view
i :	open current patch in unified diff view

	Issue List
j / k :	jump to issue after / before current issue
o / <Enter> :	open current issue

Unified Diff: libvpx/source/libvpx/vp8/encoder/arm/neon/vp8_mse16x16_neon.asm

Issue 7624054: Revert r97185 "Update libvpx snapshot to v0.9.7-p1 (Cayuga)." (Closed) Base URL: svn://chrome-svn/chrome/trunk/deps/third_party

Patch Set: Created 9 years, 4 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

« no previous file with comments | « libvpx/source/libvpx/vp8/encoder/arm/neon/fastquantizeb_neon.asm ('k') | libvpx/source/libvpx/vp8/encoder/arm/quantize_arm.h » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: libvpx/source/libvpx/vp8/encoder/arm/neon/vp8_mse16x16_neon.asm

diff --git a/libvpx/source/libvpx/vp8/encoder/arm/neon/vp8_mse16x16_neon.asm b/libvpx/source/libvpx/vp8/encoder/arm/neon/vp8_mse16x16_neon.asm

index 55edbf5129ed013ffa0b5ea32c5aa6682ad24e6c..6af4e87bab62f9609d78b7d6de7efdcc833cf7b3 100644

--- a/libvpx/source/libvpx/vp8/encoder/arm/neon/vp8_mse16x16_neon.asm

+++ b/libvpx/source/libvpx/vp8/encoder/arm/neon/vp8_mse16x16_neon.asm

@@ -10,6 +10,7 @@

EXPORT |vp8_mse16x16_neon|

+ EXPORT |vp8_get16x16pred_error_neon|

EXPORT |vp8_get4x4sse_cs_neon|

ARM

@@ -75,6 +76,62 @@ mse16x16_neon_loop

ENDP

+;============================

+; r0 unsigned char *src_ptr

+; r1 int src_stride

+; r2 unsigned char *ref_ptr

+; r3 int ref_stride

+|vp8_get16x16pred_error_neon| PROC

+ vmov.i8 q8, #0 ;q8 - sum

+ vmov.i8 q9, #0 ;q9, q10 - pred_error

+ vmov.i8 q10, #0

+ mov r12, #8

+get16x16pred_error_neon_loop

+ vld1.8 {q0}, [r0], r1 ;Load up source and reference

+ vld1.8 {q2}, [r2], r3

+ vld1.8 {q1}, [r0], r1

+ vld1.8 {q3}, [r2], r3

+ vsubl.u8 q11, d0, d4

+ vsubl.u8 q12, d1, d5

+ vsubl.u8 q13, d2, d6

+ vsubl.u8 q14, d3, d7

+ vpadal.s16 q8, q11

+ vmlal.s16 q9, d22, d22

+ vmlal.s16 q10, d23, d23

+ subs r12, r12, #1

+ vpadal.s16 q8, q12

+ vmlal.s16 q9, d24, d24

+ vmlal.s16 q10, d25, d25

+ vpadal.s16 q8, q13

+ vmlal.s16 q9, d26, d26

+ vmlal.s16 q10, d27, d27

+ vpadal.s16 q8, q14

+ vmlal.s16 q9, d28, d28

+ vmlal.s16 q10, d29, d29

+ bne get16x16pred_error_neon_loop

+ vadd.u32 q10, q9, q10

+ vpaddl.s32 q0, q8

+ vpaddl.u32 q1, q10

+ vadd.s64 d0, d0, d1

+ vadd.u64 d1, d2, d3

+ vmull.s32 q5, d0, d0

+ vshr.s32 d10, d10, #8

+ vsub.s32 d0, d1, d10

+ vmov.32 r0, d0[0]

+ bx lr

+ ENDP

;=============================

; r0 unsigned char *src_ptr,