| Index: source/libvpx/vp9/common/vp9_rtcd_defs.pl
|
| diff --git a/source/libvpx/vp9/common/vp9_rtcd_defs.pl b/source/libvpx/vp9/common/vp9_rtcd_defs.pl
|
| index 638b836730831bcd779d4e8f55def49c09764561..bbe200d0d6327fc7dafc62e85d5b04b1aba0ddb9 100644
|
| --- a/source/libvpx/vp9/common/vp9_rtcd_defs.pl
|
| +++ b/source/libvpx/vp9/common/vp9_rtcd_defs.pl
|
| @@ -216,44 +216,44 @@ specialize qw/vp9_dc_128_predictor_32x32/, "$sse2_x86inc";
|
| # Loopfilter
|
| #
|
| add_proto qw/void vp9_lpf_vertical_16/, "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh";
|
| -specialize qw/vp9_lpf_vertical_16 sse2 neon_asm dspr2/;
|
| +specialize qw/vp9_lpf_vertical_16 sse2 neon_asm dspr2 msa/;
|
| $vp9_lpf_vertical_16_neon_asm=vp9_lpf_vertical_16_neon;
|
|
|
| add_proto qw/void vp9_lpf_vertical_16_dual/, "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh";
|
| -specialize qw/vp9_lpf_vertical_16_dual sse2 neon_asm dspr2/;
|
| +specialize qw/vp9_lpf_vertical_16_dual sse2 neon_asm dspr2 msa/;
|
| $vp9_lpf_vertical_16_dual_neon_asm=vp9_lpf_vertical_16_dual_neon;
|
|
|
| add_proto qw/void vp9_lpf_vertical_8/, "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count";
|
| -specialize qw/vp9_lpf_vertical_8 sse2 neon_asm dspr2/;
|
| +specialize qw/vp9_lpf_vertical_8 sse2 neon_asm dspr2 msa/;
|
| $vp9_lpf_vertical_8_neon_asm=vp9_lpf_vertical_8_neon;
|
|
|
| add_proto qw/void vp9_lpf_vertical_8_dual/, "uint8_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1";
|
| -specialize qw/vp9_lpf_vertical_8_dual sse2 neon_asm dspr2/;
|
| +specialize qw/vp9_lpf_vertical_8_dual sse2 neon_asm dspr2 msa/;
|
| $vp9_lpf_vertical_8_dual_neon_asm=vp9_lpf_vertical_8_dual_neon;
|
|
|
| add_proto qw/void vp9_lpf_vertical_4/, "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count";
|
| -specialize qw/vp9_lpf_vertical_4 mmx neon dspr2/;
|
| +specialize qw/vp9_lpf_vertical_4 mmx neon dspr2 msa/;
|
|
|
| add_proto qw/void vp9_lpf_vertical_4_dual/, "uint8_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1";
|
| -specialize qw/vp9_lpf_vertical_4_dual sse2 neon dspr2/;
|
| +specialize qw/vp9_lpf_vertical_4_dual sse2 neon dspr2 msa/;
|
|
|
| add_proto qw/void vp9_lpf_horizontal_16/, "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count";
|
| -specialize qw/vp9_lpf_horizontal_16 sse2 avx2 neon_asm dspr2/;
|
| +specialize qw/vp9_lpf_horizontal_16 sse2 avx2 neon_asm dspr2 msa/;
|
| $vp9_lpf_horizontal_16_neon_asm=vp9_lpf_horizontal_16_neon;
|
|
|
| add_proto qw/void vp9_lpf_horizontal_8/, "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count";
|
| -specialize qw/vp9_lpf_horizontal_8 sse2 neon_asm dspr2/;
|
| +specialize qw/vp9_lpf_horizontal_8 sse2 neon_asm dspr2 msa/;
|
| $vp9_lpf_horizontal_8_neon_asm=vp9_lpf_horizontal_8_neon;
|
|
|
| add_proto qw/void vp9_lpf_horizontal_8_dual/, "uint8_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1";
|
| -specialize qw/vp9_lpf_horizontal_8_dual sse2 neon_asm dspr2/;
|
| +specialize qw/vp9_lpf_horizontal_8_dual sse2 neon_asm dspr2 msa/;
|
| $vp9_lpf_horizontal_8_dual_neon_asm=vp9_lpf_horizontal_8_dual_neon;
|
|
|
| add_proto qw/void vp9_lpf_horizontal_4/, "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count";
|
| -specialize qw/vp9_lpf_horizontal_4 mmx neon dspr2/;
|
| +specialize qw/vp9_lpf_horizontal_4 mmx neon dspr2 msa/;
|
|
|
| add_proto qw/void vp9_lpf_horizontal_4_dual/, "uint8_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1";
|
| -specialize qw/vp9_lpf_horizontal_4_dual sse2 neon dspr2/;
|
| +specialize qw/vp9_lpf_horizontal_4_dual sse2 neon dspr2 msa/;
|
|
|
| #
|
| # post proc
|
| @@ -286,28 +286,28 @@ specialize qw/vp9_filter_by_weight8x8 sse2/;
|
| # Sub Pixel Filters
|
| #
|
| add_proto qw/void vp9_convolve_copy/, "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h";
|
| -specialize qw/vp9_convolve_copy neon dspr2/, "$sse2_x86inc";
|
| +specialize qw/vp9_convolve_copy neon dspr2 msa/, "$sse2_x86inc";
|
|
|
| add_proto qw/void vp9_convolve_avg/, "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h";
|
| -specialize qw/vp9_convolve_avg neon dspr2/, "$sse2_x86inc";
|
| +specialize qw/vp9_convolve_avg neon dspr2 msa/, "$sse2_x86inc";
|
|
|
| add_proto qw/void vp9_convolve8/, "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h";
|
| -specialize qw/vp9_convolve8 sse2 ssse3 neon dspr2/, "$avx2_ssse3";
|
| +specialize qw/vp9_convolve8 sse2 ssse3 neon dspr2 msa/, "$avx2_ssse3";
|
|
|
| add_proto qw/void vp9_convolve8_horiz/, "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h";
|
| -specialize qw/vp9_convolve8_horiz sse2 ssse3 neon dspr2/, "$avx2_ssse3";
|
| +specialize qw/vp9_convolve8_horiz sse2 ssse3 neon dspr2 msa/, "$avx2_ssse3";
|
|
|
| add_proto qw/void vp9_convolve8_vert/, "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h";
|
| -specialize qw/vp9_convolve8_vert sse2 ssse3 neon dspr2/, "$avx2_ssse3";
|
| +specialize qw/vp9_convolve8_vert sse2 ssse3 neon dspr2 msa/, "$avx2_ssse3";
|
|
|
| add_proto qw/void vp9_convolve8_avg/, "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h";
|
| -specialize qw/vp9_convolve8_avg sse2 ssse3 neon dspr2/;
|
| +specialize qw/vp9_convolve8_avg sse2 ssse3 neon dspr2 msa/;
|
|
|
| add_proto qw/void vp9_convolve8_avg_horiz/, "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h";
|
| -specialize qw/vp9_convolve8_avg_horiz sse2 ssse3 neon dspr2/;
|
| +specialize qw/vp9_convolve8_avg_horiz sse2 ssse3 neon dspr2 msa/;
|
|
|
| add_proto qw/void vp9_convolve8_avg_vert/, "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h";
|
| -specialize qw/vp9_convolve8_avg_vert sse2 ssse3 neon dspr2/;
|
| +specialize qw/vp9_convolve8_avg_vert sse2 ssse3 neon dspr2 msa/;
|
|
|
| #
|
| # dct
|
| @@ -419,10 +419,10 @@ if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") {
|
| specialize qw/vp9_iwht4x4_16_add/;
|
| } else {
|
| add_proto qw/void vp9_idct4x4_1_add/, "const tran_low_t *input, uint8_t *dest, int dest_stride";
|
| - specialize qw/vp9_idct4x4_1_add sse2 neon dspr2/;
|
| + specialize qw/vp9_idct4x4_1_add sse2 neon dspr2 msa/;
|
|
|
| add_proto qw/void vp9_idct4x4_16_add/, "const tran_low_t *input, uint8_t *dest, int dest_stride";
|
| - specialize qw/vp9_idct4x4_16_add sse2 neon dspr2/;
|
| + specialize qw/vp9_idct4x4_16_add sse2 neon dspr2 msa/;
|
|
|
| add_proto qw/void vp9_idct8x8_1_add/, "const tran_low_t *input, uint8_t *dest, int dest_stride";
|
| specialize qw/vp9_idct8x8_1_add sse2 neon dspr2 msa/;
|
| @@ -454,7 +454,7 @@ if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") {
|
| specialize qw/vp9_idct32x32_1_add sse2 neon dspr2 msa/;
|
|
|
| add_proto qw/void vp9_iht4x4_16_add/, "const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type";
|
| - specialize qw/vp9_iht4x4_16_add sse2 neon dspr2/;
|
| + specialize qw/vp9_iht4x4_16_add sse2 neon dspr2 msa/;
|
|
|
| add_proto qw/void vp9_iht8x8_64_add/, "const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type";
|
| specialize qw/vp9_iht8x8_64_add sse2 neon dspr2 msa/;
|
| @@ -465,10 +465,10 @@ if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") {
|
| # dct and add
|
|
|
| add_proto qw/void vp9_iwht4x4_1_add/, "const tran_low_t *input, uint8_t *dest, int dest_stride";
|
| - specialize qw/vp9_iwht4x4_1_add/;
|
| + specialize qw/vp9_iwht4x4_1_add msa/;
|
|
|
| add_proto qw/void vp9_iwht4x4_16_add/, "const tran_low_t *input, uint8_t *dest, int dest_stride";
|
| - specialize qw/vp9_iwht4x4_16_add/;
|
| + specialize qw/vp9_iwht4x4_16_add msa/;
|
| }
|
| }
|
|
|
|
|