| Index: source/libvpx/vp8/common/x86/subpixel_ssse3.asm
|
| ===================================================================
|
| --- source/libvpx/vp8/common/x86/subpixel_ssse3.asm (revision 96967)
|
| +++ source/libvpx/vp8/common/x86/subpixel_ssse3.asm (working copy)
|
| @@ -39,6 +39,7 @@
|
| push rbp
|
| mov rbp, rsp
|
| SHADOW_ARGS_TO_STACK 6
|
| + SAVE_XMM 7
|
| GET_GOT rbx
|
| push rsi
|
| push rdi
|
| @@ -107,6 +108,7 @@
|
| pop rdi
|
| pop rsi
|
| RESTORE_GOT
|
| + RESTORE_XMM
|
| UNSHADOW_ARGS
|
| pop rbp
|
| ret
|
| @@ -162,6 +164,7 @@
|
| pop rdi
|
| pop rsi
|
| RESTORE_GOT
|
| + RESTORE_XMM
|
| UNSHADOW_ARGS
|
| pop rbp
|
| ret
|
| @@ -179,7 +182,7 @@
|
| push rbp
|
| mov rbp, rsp
|
| SHADOW_ARGS_TO_STACK 6
|
| - SAVE_XMM
|
| + SAVE_XMM 7
|
| GET_GOT rbx
|
| push rsi
|
| push rdi
|
| @@ -194,10 +197,6 @@
|
|
|
| mov rdi, arg(2) ;output_ptr
|
|
|
| -;;
|
| -;; cmp esi, DWORD PTR [rax]
|
| -;; je vp8_filter_block1d16_h4_ssse3
|
| -
|
| mov rsi, arg(0) ;src_ptr
|
|
|
| movdqa xmm4, XMMWORD PTR [rax] ;k0_k5
|
| @@ -271,65 +270,11 @@
|
| pop rdi
|
| pop rsi
|
| RESTORE_GOT
|
| + RESTORE_XMM
|
| UNSHADOW_ARGS
|
| pop rbp
|
| ret
|
|
|
| -vp8_filter_block1d16_h4_ssse3:
|
| - movdqa xmm5, XMMWORD PTR [rax+256] ;k2_k4
|
| - movdqa xmm6, XMMWORD PTR [rax+128] ;k1_k3
|
| -
|
| - mov rsi, arg(0) ;src_ptr
|
| - movsxd rax, dword ptr arg(1) ;src_pixels_per_line
|
| - movsxd rcx, dword ptr arg(4) ;output_height
|
| - movsxd rdx, dword ptr arg(3) ;output_pitch
|
| -
|
| -filter_block1d16_h4_rowloop_ssse3:
|
| - movdqu xmm1, XMMWORD PTR [rsi - 2]
|
| -
|
| - movdqa xmm2, xmm1
|
| - pshufb xmm1, [GLOBAL(shuf2b)]
|
| - pshufb xmm2, [GLOBAL(shuf3b)]
|
| - pmaddubsw xmm1, xmm5
|
| -
|
| - movdqu xmm3, XMMWORD PTR [rsi + 6]
|
| -
|
| - pmaddubsw xmm2, xmm6
|
| - movdqa xmm0, xmm3
|
| - pshufb xmm3, [GLOBAL(shuf3b)]
|
| - pshufb xmm0, [GLOBAL(shuf2b)]
|
| -
|
| - paddsw xmm1, [GLOBAL(rd)]
|
| - paddsw xmm1, xmm2
|
| -
|
| - pmaddubsw xmm0, xmm5
|
| - pmaddubsw xmm3, xmm6
|
| -
|
| - psraw xmm1, 7
|
| - packuswb xmm1, xmm1
|
| - lea rsi, [rsi + rax]
|
| - paddsw xmm3, xmm0
|
| - paddsw xmm3, [GLOBAL(rd)]
|
| - psraw xmm3, 7
|
| - packuswb xmm3, xmm3
|
| -
|
| - punpcklqdq xmm1, xmm3
|
| -
|
| - movdqa XMMWORD Ptr [rdi], xmm1
|
| -
|
| - add rdi, rdx
|
| - dec rcx
|
| - jnz filter_block1d16_h4_rowloop_ssse3
|
| -
|
| -
|
| - ; begin epilog
|
| - pop rdi
|
| - pop rsi
|
| - RESTORE_GOT
|
| - UNSHADOW_ARGS
|
| - pop rbp
|
| - ret
|
| -
|
| ;void vp8_filter_block1d4_h6_ssse3
|
| ;(
|
| ; unsigned char *src_ptr,
|
| @@ -344,6 +289,7 @@
|
| push rbp
|
| mov rbp, rsp
|
| SHADOW_ARGS_TO_STACK 6
|
| + SAVE_XMM 7
|
| GET_GOT rbx
|
| push rsi
|
| push rdi
|
| @@ -451,6 +397,7 @@
|
| pop rdi
|
| pop rsi
|
| RESTORE_GOT
|
| + RESTORE_XMM
|
| UNSHADOW_ARGS
|
| pop rbp
|
| ret
|
| @@ -471,6 +418,7 @@
|
| push rbp
|
| mov rbp, rsp
|
| SHADOW_ARGS_TO_STACK 6
|
| + SAVE_XMM 7
|
| GET_GOT rbx
|
| push rsi
|
| push rdi
|
| @@ -566,6 +514,7 @@
|
| pop rdi
|
| pop rsi
|
| RESTORE_GOT
|
| + RESTORE_XMM
|
| UNSHADOW_ARGS
|
| pop rbp
|
| ret
|
| @@ -638,6 +587,7 @@
|
| pop rdi
|
| pop rsi
|
| RESTORE_GOT
|
| + RESTORE_XMM
|
| UNSHADOW_ARGS
|
| pop rbp
|
| ret
|
| @@ -656,6 +606,7 @@
|
| push rbp
|
| mov rbp, rsp
|
| SHADOW_ARGS_TO_STACK 6
|
| + SAVE_XMM 7
|
| GET_GOT rbx
|
| push rsi
|
| push rdi
|
| @@ -728,6 +679,7 @@
|
| pop rdi
|
| pop rsi
|
| RESTORE_GOT
|
| + RESTORE_XMM
|
| UNSHADOW_ARGS
|
| pop rbp
|
| ret
|
| @@ -776,6 +728,7 @@
|
| pop rdi
|
| pop rsi
|
| RESTORE_GOT
|
| + RESTORE_XMM
|
| UNSHADOW_ARGS
|
| pop rbp
|
| ret
|
| @@ -932,7 +885,7 @@
|
| push rbp
|
| mov rbp, rsp
|
| SHADOW_ARGS_TO_STACK 6
|
| - SAVE_XMM
|
| + SAVE_XMM 7
|
| GET_GOT rbx
|
| push rsi
|
| push rdi
|
| @@ -1195,7 +1148,7 @@
|
| push rbp
|
| mov rbp, rsp
|
| SHADOW_ARGS_TO_STACK 6
|
| - SAVE_XMM
|
| + SAVE_XMM 7
|
| GET_GOT rbx
|
| push rsi
|
| push rdi
|
|
|