Index: source/libvpx/vp8/common/ppc/sad_altivec.asm
diff --git a/source/libvpx/vp8/common/ppc/sad_altivec.asm b/source/libvpx/vp8/common/ppc/sad_altivec.asm
deleted file mode 100644
index e5f26380f96be5c0dc615db4113a8dff88d0d119..0000000000000000000000000000000000000000
--- a/source/libvpx/vp8/common/ppc/sad_altivec.asm
+++ /dev/null
@@ -1,277 +0,0 @@
-;
-; Copyright (c) 2010 The WebM project authors. All Rights Reserved.
-;
-; Use of this source code is governed by a BSD-style license
-; that can be found in the LICENSE file in the root of the source
-; tree. An additional intellectual property rights grant can be found
-; in the file PATENTS. All contributing project authors may
-; be found in the AUTHORS file in the root of the source tree.
-;
-
-
- .globl vp8_sad16x16_ppc
- .globl vp8_sad16x8_ppc
- .globl vp8_sad8x16_ppc
- .globl vp8_sad8x8_ppc
- .globl vp8_sad4x4_ppc
-
-.macro load_aligned_16 V R O
- lvsl v3, 0, \R ;# permutation vector for alignment
-
- lvx v1, 0, \R
- lvx v2, \O, \R
-
- vperm \V, v1, v2, v3
-.endm
-
-.macro prologue
- mfspr r11, 256 ;# get old VRSAVE
- oris r12, r11, 0xffc0
- mtspr 256, r12 ;# set VRSAVE
-
- stwu r1, -32(r1) ;# create space on the stack
-
- li r10, 16 ;# load offset and loop counter
-
- vspltisw v8, 0 ;# zero out total to start
-.endm
-
-.macro epilogue
- addi r1, r1, 32 ;# recover stack
-
- mtspr 256, r11 ;# reset old VRSAVE
-.endm
-
-.macro SAD_16
- ;# v6 = abs (v4 - v5)
- vsububs v6, v4, v5
- vsububs v7, v5, v4
- vor v6, v6, v7
-
- ;# v8 += abs (v4 - v5)
- vsum4ubs v8, v6, v8
-.endm
-
-.macro sad_16_loop loop_label
- lvsl v3, 0, r5 ;# only needs to be done once per block
-
- ;# preload a line of data before getting into the loop
- lvx v4, 0, r3
- lvx v1, 0, r5
- lvx v2, r10, r5
-
- add r5, r5, r6
- add r3, r3, r4
-
- vperm v5, v1, v2, v3
-
- .align 4
-\loop_label:
- ;# compute difference on first row
- vsububs v6, v4, v5
- vsububs v7, v5, v4
-
- ;# load up next set of data
- lvx v9, 0, r3
- lvx v1, 0, r5
- lvx v2, r10, r5
-
- ;# perform abs() of difference
- vor v6, v6, v7
- add r3, r3, r4
-
- ;# add to the running tally
- vsum4ubs v8, v6, v8
-
- ;# now onto the next line
- vperm v5, v1, v2, v3
- add r5, r5, r6
- lvx v4, 0, r3
-
- ;# compute difference on second row
- vsububs v6, v9, v5
- lvx v1, 0, r5
- vsububs v7, v5, v9
- lvx v2, r10, r5
- vor v6, v6, v7
- add r3, r3, r4
- vsum4ubs v8, v6, v8
- vperm v5, v1, v2, v3
- add r5, r5, r6
-
- bdnz \loop_label
-
- vspltisw v7, 0
-
- vsumsws v8, v8, v7
-
- stvx v8, 0, r1
- lwz r3, 12(r1)
-.endm
-
-.macro sad_8_loop loop_label
- .align 4
-\loop_label:
- ;# only one of the inputs should need to be aligned.
- load_aligned_16 v4, r3, r10
- load_aligned_16 v5, r5, r10
-
- ;# move onto the next line
- add r3, r3, r4
- add r5, r5, r6
-
- ;# only one of the inputs should need to be aligned.
- load_aligned_16 v6, r3, r10
- load_aligned_16 v7, r5, r10
-
- ;# move onto the next line
- add r3, r3, r4
- add r5, r5, r6
-
- vmrghb v4, v4, v6
- vmrghb v5, v5, v7
-
- SAD_16
-
- bdnz \loop_label
-
- vspltisw v7, 0
-
- vsumsws v8, v8, v7
-
- stvx v8, 0, r1
- lwz r3, 12(r1)
-.endm
-
- .align 2
-;# r3 unsigned char *src_ptr
-;# r4 int src_stride
-;# r5 unsigned char *ref_ptr
-;# r6 int ref_stride
-;#
-;# r3 return value
-vp8_sad16x16_ppc:
-
- prologue
-
- li r9, 8
- mtctr r9
-
- sad_16_loop sad16x16_loop
-
- epilogue
-
- blr
-
- .align 2
-;# r3 unsigned char *src_ptr
-;# r4 int src_stride
-;# r5 unsigned char *ref_ptr
-;# r6 int ref_stride
-;#
-;# r3 return value
-vp8_sad16x8_ppc:
-
- prologue
-
- li r9, 4
- mtctr r9
-
- sad_16_loop sad16x8_loop
-
- epilogue
-
- blr
-
- .align 2
-;# r3 unsigned char *src_ptr
-;# r4 int src_stride
-;# r5 unsigned char *ref_ptr
-;# r6 int ref_stride
-;#
-;# r3 return value
-vp8_sad8x16_ppc:
-
- prologue
-
- li r9, 8
- mtctr r9
-
- sad_8_loop sad8x16_loop
-
- epilogue
-
- blr
-
- .align 2
-;# r3 unsigned char *src_ptr
-;# r4 int src_stride
-;# r5 unsigned char *ref_ptr
-;# r6 int ref_stride
-;#
-;# r3 return value
-vp8_sad8x8_ppc:
-
- prologue
-
- li r9, 4
- mtctr r9
-
- sad_8_loop sad8x8_loop
-
- epilogue
-
- blr
-
-.macro transfer_4x4 I P
- lwz r0, 0(\I)
- add \I, \I, \P
-
- lwz r7, 0(\I)
- add \I, \I, \P
-
- lwz r8, 0(\I)
- add \I, \I, \P
-
- lwz r9, 0(\I)
-
- stw r0, 0(r1)
- stw r7, 4(r1)
- stw r8, 8(r1)
- stw r9, 12(r1)
-.endm
-
- .align 2
-;# r3 unsigned char *src_ptr
-;# r4 int src_stride
-;# r5 unsigned char *ref_ptr
-;# r6 int ref_stride
-;#
-;# r3 return value
-vp8_sad4x4_ppc:
-
- prologue
-
- transfer_4x4 r3, r4
- lvx v4, 0, r1
-
- transfer_4x4 r5, r6
- lvx v5, 0, r1
-
- vspltisw v8, 0 ;# zero out total to start
-
- ;# v6 = abs (v4 - v5)
- vsububs v6, v4, v5
- vsububs v7, v5, v4
- vor v6, v6, v7
-
- ;# v8 += abs (v4 - v5)
- vsum4ubs v7, v6, v8
- vsumsws v7, v7, v8
-
- stvx v7, 0, r1
- lwz r3, 12(r1)
-
- epilogue
-
- blr
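
For reference, every routine removed above computes a plain sum of absolute differences between a source block and a reference block. A minimal scalar C sketch of that operation follows; the function name and signature are illustrative only, not the libvpx API.

#include <stdlib.h>

/* Scalar sketch of the SAD the deleted AltiVec routines computed:
 * accumulate |src - ref| over a width x height block of bytes.
 * Name and signature are illustrative, not taken from libvpx. */
static unsigned int block_sad(const unsigned char *src_ptr, int src_stride,
                              const unsigned char *ref_ptr, int ref_stride,
                              int width, int height)
{
    unsigned int sad = 0;
    int r, c;

    for (r = 0; r < height; r++) {
        for (c = 0; c < width; c++)
            sad += abs(src_ptr[c] - ref_ptr[c]);

        src_ptr += src_stride;  /* step down one row in each buffer */
        ref_ptr += ref_stride;
    }
    return sad;
}

The AltiVec loops above vectorize the same arithmetic a row (or pair of rows) at a time: vsububs in both directions followed by vor yields the per-byte absolute difference, vsum4ubs accumulates those bytes into four word-sized partial sums in v8, and the final vsumsws folds them into the single total that is returned in r3.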