source/libvpx/vp8/encoder/arm/armv6/vp8_variance_halfpixvar16x16_v_armv6.asm - Issue 7671004: Update libvpx snapshot to v0.9.7-p1 (Cayuga).

Side by Side Diff: source/libvpx/vp8/encoder/arm/armv6/vp8_variance_halfpixvar16x16_v_armv6.asm

Issue 7671004: Update libvpx snapshot to v0.9.7-p1 (Cayuga). (Closed) Base URL: svn://chrome-svn/chrome/trunk/deps/third_party/libvpx/

Patch Set: '' Created 9 years, 4 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View unified diff | Download patch | Annotate | Revision Log

« no previous file with comments | « source/libvpx/vp8/encoder/arm/armv6/vp8_variance_halfpixvar16x16_hv_armv6.asm ('k') | source/libvpx/vp8/encoder/arm/neon/fastquantizeb_neon.asm » ('j') | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

OLD	NEW
1 ;	1 ;

2 ; Copyright (c) 2011 The WebM project authors. All Rights Reserved.	2 ; Copyright (c) 2011 The WebM project authors. All Rights Reserved.

3 ;	3 ;

4 ; Use of this source code is governed by a BSD-style license	4 ; Use of this source code is governed by a BSD-style license

5 ; that can be found in the LICENSE file in the root of the source	5 ; that can be found in the LICENSE file in the root of the source

6 ; tree. An additional intellectual property rights grant can be found	6 ; tree. An additional intellectual property rights grant can be found

7 ; in the file PATENTS. All contributing project authors may	7 ; in the file PATENTS. All contributing project authors may

8 ; be found in the AUTHORS file in the root of the source tree.	8 ; be found in the AUTHORS file in the root of the source tree.

9 ;	9 ;

10	10

11	11

12 EXPORT \|vp8_variance_halfpixvar16x16_v_armv6\|	12 EXPORT \|vp8_variance_halfpixvar16x16_v_armv6\|

13	13

14 ARM	14 ARM

15 REQUIRE8	15 REQUIRE8

16 PRESERVE8	16 PRESERVE8

17	17

18 AREA \|\|.text\|\|, CODE, READONLY, ALIGN=2	18 AREA \|\|.text\|\|, CODE, READONLY, ALIGN=2

19	19

20 ; r0 unsigned char *src_ptr	20 ; r0 unsigned char *src_ptr

21 ; r1 int source_stride	21 ; r1 int source_stride

22 ; r2 unsigned char *ref_ptr	22 ; r2 unsigned char *ref_ptr

23 ; r3 int recon_stride	23 ; r3 int recon_stride

24 ; stack unsigned int *sse	24 ; stack unsigned int *sse

25 \|vp8_variance_halfpixvar16x16_v_armv6\| PROC	25 \|vp8_variance_halfpixvar16x16_v_armv6\| PROC

26	26

27 stmfd sp!, {r4-r12, lr}	27 stmfd sp!, {r4-r12, lr}

	28

	29 pld [r0, r1, lsl #0]

	30 pld [r2, r3, lsl #0]

	31

28 mov r8, #0 ; initialize sum = 0	32 mov r8, #0 ; initialize sum = 0

29 ldr r10, c80808080	33 ldr r10, c80808080

30 mov r11, #0 ; initialize sse = 0	34 mov r11, #0 ; initialize sse = 0

31 mov r12, #16 ; set loop counter to 16 (=block height)	35 mov r12, #16 ; set loop counter to 16 (=block height)

32 mov lr, #0 ; constant zero	36 mov lr, #0 ; constant zero

33 loop	37 loop

34 add r9, r0, r1 ; set src pointer to next row	38 add r9, r0, r1 ; set src pointer to next row

35 ; 1st 4 pixels	39 ; 1st 4 pixels

36 ldr r4, [r0, #0] ; load 4 src pixels	40 ldr r4, [r0, #0] ; load 4 src pixels

37 ldr r6, [r9, #0] ; load 4 src pixels from next row	41 ldr r6, [r9, #0] ; load 4 src pixels from next row

38 ldr r5, [r2, #0] ; load 4 ref pixels	42 ldr r5, [r2, #0] ; load 4 ref pixels

39	43

40 ; bilinear interpolation	44 ; bilinear interpolation

41 mvn r6, r6	45 mvn r6, r6

42 uhsub8 r4, r4, r6	46 uhsub8 r4, r4, r6

43 eor r4, r4, r10	47 eor r4, r4, r10

44	48

45 usub8 r6, r4, r5 ; calculate difference	49 usub8 r6, r4, r5 ; calculate difference

	50 pld [r0, r1, lsl #1]

46 sel r7, r6, lr ; select bytes with positive difference	51 sel r7, r6, lr ; select bytes with positive difference

47 usub8 r6, r5, r4 ; calculate difference with reversed operands	52 usub8 r6, r5, r4 ; calculate difference with reversed operands

	53 pld [r2, r3, lsl #1]

48 sel r6, r6, lr ; select bytes with negative difference	54 sel r6, r6, lr ; select bytes with negative difference

49	55

50 ; calculate partial sums	56 ; calculate partial sums

51 usad8 r4, r7, lr ; calculate sum of positive differences	57 usad8 r4, r7, lr ; calculate sum of positive differences

52 usad8 r5, r6, lr ; calculate sum of negative differences	58 usad8 r5, r6, lr ; calculate sum of negative differences

53 orr r6, r6, r7 ; differences of all 4 pixels	59 orr r6, r6, r7 ; differences of all 4 pixels

54 ; calculate total sum	60 ; calculate total sum

55 adds r8, r8, r4 ; add positive differences to sum	61 adds r8, r8, r4 ; add positive differences to sum

56 subs r8, r8, r5 ; substract negative differences from sum	62 subs r8, r8, r5 ; substract negative differences from sum

57	63

(...skipping 111 matching lines...) Expand 10 before \| Expand all \| Expand 10 after Loading...
169	175

170 ldmfd sp!, {r4-r12, pc}	176 ldmfd sp!, {r4-r12, pc}

171	177

172 ENDP	178 ENDP

173	179

174 c80808080	180 c80808080

175 DCD 0x80808080	181 DCD 0x80808080

176	182

177 END	183 END

178	184

OLD	NEW