Index: source/libvpx/vp9/common/arm/neon/vp9_short_idct16x16_add_neon.asm |
=================================================================== |
--- source/libvpx/vp9/common/arm/neon/vp9_short_idct16x16_add_neon.asm (revision 232232) |
+++ source/libvpx/vp9/common/arm/neon/vp9_short_idct16x16_add_neon.asm (working copy) |
@@ -8,12 +8,10 @@ |
; be found in the AUTHORS file in the root of the source tree. |
; |
- EXPORT |vp9_short_idct16x16_add_neon_pass1| |
- EXPORT |vp9_short_idct16x16_add_neon_pass2| |
- EXPORT |vp9_short_idct10_16x16_add_neon_pass1| |
- EXPORT |vp9_short_idct10_16x16_add_neon_pass2| |
- EXPORT |save_neon_registers| |
- EXPORT |restore_neon_registers| |
+ EXPORT |vp9_idct16x16_256_add_neon_pass1| |
+ EXPORT |vp9_idct16x16_256_add_neon_pass2| |
+ EXPORT |vp9_idct16x16_10_add_neon_pass1| |
+ EXPORT |vp9_idct16x16_10_add_neon_pass2| |
ARM |
REQUIRE8 |
PRESERVE8 |
@@ -38,7 +36,7 @@ |
MEND |
AREA Block, CODE, READONLY ; name this block of code |
-;void |vp9_short_idct16x16_add_neon_pass1|(int16_t *input, |
+;void |vp9_idct16x16_256_add_neon_pass1|(int16_t *input, |
; int16_t *output, int output_stride) |
; |
; r0 int16_t input |
@@ -48,7 +46,7 @@ |
; idct16 stage1 - stage6 on all the elements loaded in q8-q15. The output |
; will be stored back into q8-q15 registers. This function will touch q0-q7 |
; registers and use them as buffer during calculation. |
-|vp9_short_idct16x16_add_neon_pass1| PROC |
+|vp9_idct16x16_256_add_neon_pass1| PROC |
; TODO(hkuang): Find a better way to load the elements. |
; load elements of 0, 2, 4, 6, 8, 10, 12, 14 into q8 - q15 |
@@ -275,9 +273,9 @@ |
vst1.64 {d31}, [r1], r2 |
bx lr |
- ENDP ; |vp9_short_idct16x16_add_neon_pass1| |
+ ENDP ; |vp9_idct16x16_256_add_neon_pass1| |
-;void vp9_short_idct16x16_add_neon_pass2(int16_t *src, |
+;void vp9_idct16x16_256_add_neon_pass2(int16_t *src, |
; int16_t *output, |
; int16_t *pass1Output, |
; int16_t skip_adding, |
@@ -294,7 +292,7 @@ |
; idct16 stage1 - stage7 on all the elements loaded in q8-q15. The output |
; will be stored back into q8-q15 registers. This function will touch q0-q7 |
; registers and use them as buffer during calculation. |
-|vp9_short_idct16x16_add_neon_pass2| PROC |
+|vp9_idct16x16_256_add_neon_pass2| PROC |
push {r3-r9} |
; TODO(hkuang): Find a better way to load the elements. |
@@ -786,9 +784,9 @@ |
end_idct16x16_pass2 |
pop {r3-r9} |
bx lr |
- ENDP ; |vp9_short_idct16x16_add_neon_pass2| |
+ ENDP ; |vp9_idct16x16_256_add_neon_pass2| |
-;void |vp9_short_idct10_16x16_add_neon_pass1|(int16_t *input, |
+;void |vp9_idct16x16_10_add_neon_pass1|(int16_t *input, |
; int16_t *output, int output_stride) |
; |
; r0 int16_t input |
@@ -798,7 +796,7 @@ |
; idct16 stage1 - stage6 on all the elements loaded in q8-q15. The output |
; will be stored back into q8-q15 registers. This function will touch q0-q7 |
; registers and use them as buffer during calculation. |
-|vp9_short_idct10_16x16_add_neon_pass1| PROC |
+|vp9_idct16x16_10_add_neon_pass1| PROC |
; TODO(hkuang): Find a better way to load the elements. |
; load elements of 0, 2, 4, 6, 8, 10, 12, 14 into q8 - q15 |
@@ -907,9 +905,9 @@ |
vst1.64 {d31}, [r1], r2 |
bx lr |
- ENDP ; |vp9_short_idct10_16x16_add_neon_pass1| |
+ ENDP ; |vp9_idct16x16_10_add_neon_pass1| |
-;void vp9_short_idct10_16x16_add_neon_pass2(int16_t *src, |
+;void vp9_idct16x16_10_add_neon_pass2(int16_t *src, |
; int16_t *output, |
; int16_t *pass1Output, |
; int16_t skip_adding, |
@@ -926,7 +924,7 @@ |
; idct16 stage1 - stage7 on all the elements loaded in q8-q15. The output |
; will be stored back into q8-q15 registers. This function will touch q0-q7 |
; registers and use them as buffer during calculation. |
-|vp9_short_idct10_16x16_add_neon_pass2| PROC |
+|vp9_idct16x16_10_add_neon_pass2| PROC |
push {r3-r9} |
; TODO(hkuang): Find a better way to load the elements. |
@@ -1177,15 +1175,5 @@ |
end_idct10_16x16_pass2 |
pop {r3-r9} |
bx lr |
- ENDP ; |vp9_short_idct10_16x16_add_neon_pass2| |
-;void |save_neon_registers|() |
-|save_neon_registers| PROC |
- vpush {d8-d15} |
- bx lr |
- ENDP ; |save_registers| |
-;void |restore_neon_registers|() |
-|restore_neon_registers| PROC |
- vpop {d8-d15} |
- bx lr |
- ENDP ; |restore_registers| |
+ ENDP ; |vp9_idct16x16_10_add_neon_pass2| |
END |