| Index: source/libvpx/vp9/common/arm/neon/vp9_short_idct16x16_add_neon.asm
|
| ===================================================================
|
| --- source/libvpx/vp9/common/arm/neon/vp9_short_idct16x16_add_neon.asm (revision 232232)
|
| +++ source/libvpx/vp9/common/arm/neon/vp9_short_idct16x16_add_neon.asm (working copy)
|
| @@ -8,12 +8,10 @@
|
| ; be found in the AUTHORS file in the root of the source tree.
|
| ;
|
|
|
| - EXPORT |vp9_short_idct16x16_add_neon_pass1|
|
| - EXPORT |vp9_short_idct16x16_add_neon_pass2|
|
| - EXPORT |vp9_short_idct10_16x16_add_neon_pass1|
|
| - EXPORT |vp9_short_idct10_16x16_add_neon_pass2|
|
| - EXPORT |save_neon_registers|
|
| - EXPORT |restore_neon_registers|
|
| + EXPORT |vp9_idct16x16_256_add_neon_pass1|
|
| + EXPORT |vp9_idct16x16_256_add_neon_pass2|
|
| + EXPORT |vp9_idct16x16_10_add_neon_pass1|
|
| + EXPORT |vp9_idct16x16_10_add_neon_pass2|
|
| ARM
|
| REQUIRE8
|
| PRESERVE8
|
| @@ -38,7 +36,7 @@
|
| MEND
|
|
|
| AREA Block, CODE, READONLY ; name this block of code
|
| -;void |vp9_short_idct16x16_add_neon_pass1|(int16_t *input,
|
| +;void |vp9_idct16x16_256_add_neon_pass1|(int16_t *input,
|
| ; int16_t *output, int output_stride)
|
| ;
|
| ; r0 int16_t input
|
| @@ -48,7 +46,7 @@
|
| ; idct16 stage1 - stage6 on all the elements loaded in q8-q15. The output
|
| ; will be stored back into q8-q15 registers. This function will touch q0-q7
|
| ; registers and use them as buffer during calculation.
|
| -|vp9_short_idct16x16_add_neon_pass1| PROC
|
| +|vp9_idct16x16_256_add_neon_pass1| PROC
|
|
|
| ; TODO(hkuang): Find a better way to load the elements.
|
| ; load elements of 0, 2, 4, 6, 8, 10, 12, 14 into q8 - q15
|
| @@ -275,9 +273,9 @@
|
| vst1.64 {d31}, [r1], r2
|
|
|
| bx lr
|
| - ENDP ; |vp9_short_idct16x16_add_neon_pass1|
|
| + ENDP ; |vp9_idct16x16_256_add_neon_pass1|
|
|
|
| -;void vp9_short_idct16x16_add_neon_pass2(int16_t *src,
|
| +;void vp9_idct16x16_256_add_neon_pass2(int16_t *src,
|
| ; int16_t *output,
|
| ; int16_t *pass1Output,
|
| ; int16_t skip_adding,
|
| @@ -294,7 +292,7 @@
|
| ; idct16 stage1 - stage7 on all the elements loaded in q8-q15. The output
|
| ; will be stored back into q8-q15 registers. This function will touch q0-q7
|
| ; registers and use them as buffer during calculation.
|
| -|vp9_short_idct16x16_add_neon_pass2| PROC
|
| +|vp9_idct16x16_256_add_neon_pass2| PROC
|
| push {r3-r9}
|
|
|
| ; TODO(hkuang): Find a better way to load the elements.
|
| @@ -786,9 +784,9 @@
|
| end_idct16x16_pass2
|
| pop {r3-r9}
|
| bx lr
|
| - ENDP ; |vp9_short_idct16x16_add_neon_pass2|
|
| + ENDP ; |vp9_idct16x16_256_add_neon_pass2|
|
|
|
| -;void |vp9_short_idct10_16x16_add_neon_pass1|(int16_t *input,
|
| +;void |vp9_idct16x16_10_add_neon_pass1|(int16_t *input,
|
| ; int16_t *output, int output_stride)
|
| ;
|
| ; r0 int16_t input
|
| @@ -798,7 +796,7 @@
|
| ; idct16 stage1 - stage6 on all the elements loaded in q8-q15. The output
|
| ; will be stored back into q8-q15 registers. This function will touch q0-q7
|
| ; registers and use them as buffer during calculation.
|
| -|vp9_short_idct10_16x16_add_neon_pass1| PROC
|
| +|vp9_idct16x16_10_add_neon_pass1| PROC
|
|
|
| ; TODO(hkuang): Find a better way to load the elements.
|
| ; load elements of 0, 2, 4, 6, 8, 10, 12, 14 into q8 - q15
|
| @@ -907,9 +905,9 @@
|
| vst1.64 {d31}, [r1], r2
|
|
|
| bx lr
|
| - ENDP ; |vp9_short_idct10_16x16_add_neon_pass1|
|
| + ENDP ; |vp9_idct16x16_10_add_neon_pass1|
|
|
|
| -;void vp9_short_idct10_16x16_add_neon_pass2(int16_t *src,
|
| +;void vp9_idct16x16_10_add_neon_pass2(int16_t *src,
|
| ; int16_t *output,
|
| ; int16_t *pass1Output,
|
| ; int16_t skip_adding,
|
| @@ -926,7 +924,7 @@
|
| ; idct16 stage1 - stage7 on all the elements loaded in q8-q15. The output
|
| ; will be stored back into q8-q15 registers. This function will touch q0-q7
|
| ; registers and use them as buffer during calculation.
|
| -|vp9_short_idct10_16x16_add_neon_pass2| PROC
|
| +|vp9_idct16x16_10_add_neon_pass2| PROC
|
| push {r3-r9}
|
|
|
| ; TODO(hkuang): Find a better way to load the elements.
|
| @@ -1177,15 +1175,5 @@
|
| end_idct10_16x16_pass2
|
| pop {r3-r9}
|
| bx lr
|
| - ENDP ; |vp9_short_idct10_16x16_add_neon_pass2|
|
| -;void |save_neon_registers|()
|
| -|save_neon_registers| PROC
|
| - vpush {d8-d15}
|
| - bx lr
|
| - ENDP ; |save_registers|
|
| -;void |restore_neon_registers|()
|
| -|restore_neon_registers| PROC
|
| - vpop {d8-d15}
|
| - bx lr
|
| - ENDP ; |restore_registers|
|
| + ENDP ; |vp9_idct16x16_10_add_neon_pass2|
|
| END
|
|
|