| OLD | NEW | 
|---|
| 1 ; | 1 ; | 
| 2 ;  Copyright (c) 2010 The WebM project authors. All Rights Reserved. | 2 ;  Copyright (c) 2010 The WebM project authors. All Rights Reserved. | 
| 3 ; | 3 ; | 
| 4 ;  Use of this source code is governed by a BSD-style license | 4 ;  Use of this source code is governed by a BSD-style license | 
| 5 ;  that can be found in the LICENSE file in the root of the source | 5 ;  that can be found in the LICENSE file in the root of the source | 
| 6 ;  tree. An additional intellectual property rights grant can be found | 6 ;  tree. An additional intellectual property rights grant can be found | 
| 7 ;  in the file PATENTS.  All contributing project authors may | 7 ;  in the file PATENTS.  All contributing project authors may | 
| 8 ;  be found in the AUTHORS file in the root of the source tree. | 8 ;  be found in the AUTHORS file in the root of the source tree. | 
| 9 ; | 9 ; | 
| 10 | 10 | 
| 11 | 11 | 
| 12 %include "vpx_ports/x86_abi_support.asm" | 12 %include "vpx_ports/x86_abi_support.asm" | 
| 13 | 13 | 
| 14 ;void vp8_post_proc_down_and_across_xmm | 14 ;void vp8_post_proc_down_and_across_xmm | 
| 15 ;( | 15 ;( | 
| 16 ;    unsigned char *src_ptr, | 16 ;    unsigned char *src_ptr, | 
| 17 ;    unsigned char *dst_ptr, | 17 ;    unsigned char *dst_ptr, | 
| 18 ;    int src_pixels_per_line, | 18 ;    int src_pixels_per_line, | 
| 19 ;    int dst_pixels_per_line, | 19 ;    int dst_pixels_per_line, | 
| 20 ;    int rows, | 20 ;    int rows, | 
| 21 ;    int cols, | 21 ;    int cols, | 
| 22 ;    int flimit | 22 ;    int flimit | 
| 23 ;) | 23 ;) | 
| 24 global sym(vp8_post_proc_down_and_across_xmm) | 24 global sym(vp8_post_proc_down_and_across_xmm) | 
| 25 sym(vp8_post_proc_down_and_across_xmm): | 25 sym(vp8_post_proc_down_and_across_xmm): | 
| 26     push        rbp | 26     push        rbp | 
| 27     mov         rbp, rsp | 27     mov         rbp, rsp | 
| 28     SHADOW_ARGS_TO_STACK 7 | 28     SHADOW_ARGS_TO_STACK 7 | 
| 29     SAVE_XMM | 29     SAVE_XMM 7 | 
| 30     GET_GOT     rbx | 30     GET_GOT     rbx | 
| 31     push        rsi | 31     push        rsi | 
| 32     push        rdi | 32     push        rdi | 
| 33     ; end prolog | 33     ; end prolog | 
| 34 | 34 | 
| 35 %if ABI_IS_32BIT=1 && CONFIG_PIC=1 | 35 %if ABI_IS_32BIT=1 && CONFIG_PIC=1 | 
| 36     ALIGN_STACK 16, rax | 36     ALIGN_STACK 16, rax | 
| 37     ; move the global rd onto the stack, since we don't have enough registers | 37     ; move the global rd onto the stack, since we don't have enough registers | 
| 38     ; to do PIC addressing | 38     ; to do PIC addressing | 
| 39     movdqa      xmm0, [GLOBAL(rd42)] | 39     movdqa      xmm0, [GLOBAL(rd42)] | 
| (...skipping 209 matching lines...) Expand 10 before | Expand all | Expand 10 after  Loading... | 
| 249 | 249 | 
| 250 | 250 | 
| 251 ;void vp8_mbpost_proc_down_xmm(unsigned char *dst, | 251 ;void vp8_mbpost_proc_down_xmm(unsigned char *dst, | 
| 252 ;                            int pitch, int rows, int cols,int flimit) | 252 ;                            int pitch, int rows, int cols,int flimit) | 
| 253 extern sym(vp8_rv) | 253 extern sym(vp8_rv) | 
| 254 global sym(vp8_mbpost_proc_down_xmm) | 254 global sym(vp8_mbpost_proc_down_xmm) | 
| 255 sym(vp8_mbpost_proc_down_xmm): | 255 sym(vp8_mbpost_proc_down_xmm): | 
| 256     push        rbp | 256     push        rbp | 
| 257     mov         rbp, rsp | 257     mov         rbp, rsp | 
| 258     SHADOW_ARGS_TO_STACK 5 | 258     SHADOW_ARGS_TO_STACK 5 | 
| 259     SAVE_XMM | 259     SAVE_XMM 7 | 
| 260     GET_GOT     rbx | 260     GET_GOT     rbx | 
| 261     push        rsi | 261     push        rsi | 
| 262     push        rdi | 262     push        rdi | 
| 263     ; end prolog | 263     ; end prolog | 
| 264 | 264 | 
| 265     ALIGN_STACK 16, rax | 265     ALIGN_STACK 16, rax | 
| 266     sub         rsp, 128+16 | 266     sub         rsp, 128+16 | 
| 267 | 267 | 
| 268     ; unsigned char d[16][8] at [rsp] | 268     ; unsigned char d[16][8] at [rsp] | 
| 269     ; create flimit2 at [rsp+128] | 269     ; create flimit2 at [rsp+128] | 
| (...skipping 179 matching lines...) Expand 10 before | Expand all | Expand 10 after  Loading... | 
| 449 %undef flimit4 | 449 %undef flimit4 | 
| 450 | 450 | 
| 451 | 451 | 
| 452 ;void vp8_mbpost_proc_across_ip_xmm(unsigned char *src, | 452 ;void vp8_mbpost_proc_across_ip_xmm(unsigned char *src, | 
| 453 ;                                int pitch, int rows, int cols,int flimit) | 453 ;                                int pitch, int rows, int cols,int flimit) | 
| 454 global sym(vp8_mbpost_proc_across_ip_xmm) | 454 global sym(vp8_mbpost_proc_across_ip_xmm) | 
| 455 sym(vp8_mbpost_proc_across_ip_xmm): | 455 sym(vp8_mbpost_proc_across_ip_xmm): | 
| 456     push        rbp | 456     push        rbp | 
| 457     mov         rbp, rsp | 457     mov         rbp, rsp | 
| 458     SHADOW_ARGS_TO_STACK 5 | 458     SHADOW_ARGS_TO_STACK 5 | 
| 459     SAVE_XMM | 459     SAVE_XMM 7 | 
| 460     GET_GOT     rbx | 460     GET_GOT     rbx | 
| 461     push        rsi | 461     push        rsi | 
| 462     push        rdi | 462     push        rdi | 
| 463     ; end prolog | 463     ; end prolog | 
| 464 | 464 | 
| 465     ALIGN_STACK 16, rax | 465     ALIGN_STACK 16, rax | 
| 466     sub         rsp, 16 | 466     sub         rsp, 16 | 
| 467 | 467 | 
| 468     ; create flimit4 at [rsp] | 468     ; create flimit4 at [rsp] | 
| 469     mov         eax, dword ptr arg(4) ;flimit | 469     mov         eax, dword ptr arg(4) ;flimit | 
| (...skipping 216 matching lines...) Expand 10 before | Expand all | Expand 10 after  Loading... | 
| 686     pop         rbp | 686     pop         rbp | 
| 687     ret | 687     ret | 
| 688 | 688 | 
| 689 | 689 | 
| 690 SECTION_RODATA | 690 SECTION_RODATA | 
| 691 align 16 | 691 align 16 | 
| 692 rd42: | 692 rd42: | 
| 693     times 8 dw 0x04 | 693     times 8 dw 0x04 | 
| 694 four8s: | 694 four8s: | 
| 695     times 4 dd 8 | 695     times 4 dd 8 | 
| OLD | NEW | 
|---|