Index: source/libvpx/vp9/common/vp9_rtcd_defs.pl |
=================================================================== |
--- source/libvpx/vp9/common/vp9_rtcd_defs.pl (revision 290053) |
+++ source/libvpx/vp9/common/vp9_rtcd_defs.pl (working copy) |
@@ -414,13 +414,13 @@ |
specialize qw/vp9_variance32x64/, "$sse2_x86inc"; |
add_proto qw/unsigned int vp9_variance32x32/, "const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; |
-specialize qw/vp9_variance32x32 avx2/, "$sse2_x86inc"; |
+specialize qw/vp9_variance32x32 avx2 neon/, "$sse2_x86inc"; |
add_proto qw/unsigned int vp9_variance64x64/, "const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; |
specialize qw/vp9_variance64x64 avx2/, "$sse2_x86inc"; |
add_proto qw/unsigned int vp9_variance16x16/, "const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; |
-specialize qw/vp9_variance16x16 mmx avx2/, "$sse2_x86inc"; |
+specialize qw/vp9_variance16x16 mmx avx2 neon/, "$sse2_x86inc"; |
add_proto qw/unsigned int vp9_variance16x8/, "const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; |
specialize qw/vp9_variance16x8 mmx/, "$sse2_x86inc"; |
@@ -429,13 +429,13 @@ |
specialize qw/vp9_variance8x16 mmx/, "$sse2_x86inc"; |
add_proto qw/unsigned int vp9_variance8x8/, "const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; |
-specialize qw/vp9_variance8x8 mmx/, "$sse2_x86inc"; |
+specialize qw/vp9_variance8x8 mmx neon/, "$sse2_x86inc"; |
add_proto qw/void vp9_get8x8var/, "const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, int *sum"; |
-specialize qw/vp9_get8x8var mmx/, "$sse2_x86inc"; |
+specialize qw/vp9_get8x8var mmx neon/, "$sse2_x86inc"; |
add_proto qw/void vp9_get16x16var/, "const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, int *sum"; |
-specialize qw/vp9_get16x16var avx2/, "$sse2_x86inc"; |
+specialize qw/vp9_get16x16var avx2 neon/, "$sse2_x86inc"; |
add_proto qw/unsigned int vp9_variance8x4/, "const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; |
specialize qw/vp9_variance8x4/, "$sse2_x86inc"; |
@@ -447,10 +447,10 @@ |
specialize qw/vp9_variance4x4 mmx/, "$sse2_x86inc"; |
add_proto qw/unsigned int vp9_sub_pixel_variance64x64/, "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; |
-specialize qw/vp9_sub_pixel_variance64x64/, "$sse2_x86inc", "$ssse3_x86inc"; |
+specialize qw/vp9_sub_pixel_variance64x64 avx2/, "$sse2_x86inc", "$ssse3_x86inc"; |
add_proto qw/unsigned int vp9_sub_pixel_avg_variance64x64/, "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred"; |
-specialize qw/vp9_sub_pixel_avg_variance64x64/, "$sse2_x86inc", "$ssse3_x86inc"; |
+specialize qw/vp9_sub_pixel_avg_variance64x64 avx2/, "$sse2_x86inc", "$ssse3_x86inc"; |
add_proto qw/unsigned int vp9_sub_pixel_variance32x64/, "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; |
specialize qw/vp9_sub_pixel_variance32x64/, "$sse2_x86inc", "$ssse3_x86inc"; |
@@ -477,13 +477,13 @@ |
specialize qw/vp9_sub_pixel_avg_variance16x32/, "$sse2_x86inc", "$ssse3_x86inc"; |
add_proto qw/unsigned int vp9_sub_pixel_variance32x32/, "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; |
-specialize qw/vp9_sub_pixel_variance32x32/, "$sse2_x86inc", "$ssse3_x86inc"; |
+specialize qw/vp9_sub_pixel_variance32x32 avx2 neon/, "$sse2_x86inc", "$ssse3_x86inc"; |
add_proto qw/unsigned int vp9_sub_pixel_avg_variance32x32/, "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred"; |
-specialize qw/vp9_sub_pixel_avg_variance32x32/, "$sse2_x86inc", "$ssse3_x86inc"; |
+specialize qw/vp9_sub_pixel_avg_variance32x32 avx2/, "$sse2_x86inc", "$ssse3_x86inc"; |
add_proto qw/unsigned int vp9_sub_pixel_variance16x16/, "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; |
-specialize qw/vp9_sub_pixel_variance16x16/, "$sse2_x86inc", "$ssse3_x86inc"; |
+specialize qw/vp9_sub_pixel_variance16x16 neon/, "$sse2_x86inc", "$ssse3_x86inc"; |
add_proto qw/unsigned int vp9_sub_pixel_avg_variance16x16/, "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred"; |
specialize qw/vp9_sub_pixel_avg_variance16x16/, "$sse2_x86inc", "$ssse3_x86inc"; |
@@ -501,7 +501,7 @@ |
specialize qw/vp9_sub_pixel_avg_variance16x8/, "$sse2_x86inc", "$ssse3_x86inc"; |
add_proto qw/unsigned int vp9_sub_pixel_variance8x8/, "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; |
-specialize qw/vp9_sub_pixel_variance8x8/, "$sse2_x86inc", "$ssse3_x86inc"; |
+specialize qw/vp9_sub_pixel_variance8x8 neon/, "$sse2_x86inc", "$ssse3_x86inc"; |
add_proto qw/unsigned int vp9_sub_pixel_avg_variance8x8/, "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred"; |
specialize qw/vp9_sub_pixel_avg_variance8x8/, "$sse2_x86inc", "$ssse3_x86inc"; |
@@ -554,7 +554,7 @@ |
specialize qw/vp9_sad8x16 mmx/, "$sse2_x86inc"; |
add_proto qw/unsigned int vp9_sad8x8/, "const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride"; |
-specialize qw/vp9_sad8x8 mmx/, "$sse2_x86inc"; |
+specialize qw/vp9_sad8x8 mmx neon/, "$sse2_x86inc"; |
add_proto qw/unsigned int vp9_sad8x4/, "const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride"; |
specialize qw/vp9_sad8x4/, "$sse2_x86inc"; |
@@ -653,7 +653,7 @@ |
specialize qw/vp9_sad4x4x8 sse4/; |
add_proto qw/void vp9_sad64x64x4d/, "const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array"; |
-specialize qw/vp9_sad64x64x4d sse2/; |
+specialize qw/vp9_sad64x64x4d sse2 avx2/; |
add_proto qw/void vp9_sad32x64x4d/, "const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array"; |
specialize qw/vp9_sad32x64x4d sse2/; |
@@ -668,7 +668,7 @@ |
specialize qw/vp9_sad16x32x4d sse2/; |
add_proto qw/void vp9_sad32x32x4d/, "const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array"; |
-specialize qw/vp9_sad32x32x4d sse2/; |
+specialize qw/vp9_sad32x32x4d sse2 avx2/; |
add_proto qw/void vp9_sad16x16x4d/, "const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array"; |
specialize qw/vp9_sad16x16x4d sse2/; |
@@ -712,10 +712,10 @@ |
specialize qw/vp9_block_error avx2/, "$sse2_x86inc"; |
add_proto qw/void vp9_subtract_block/, "int rows, int cols, int16_t *diff_ptr, ptrdiff_t diff_stride, const uint8_t *src_ptr, ptrdiff_t src_stride, const uint8_t *pred_ptr, ptrdiff_t pred_stride"; |
-specialize qw/vp9_subtract_block/, "$sse2_x86inc"; |
+specialize qw/vp9_subtract_block neon/, "$sse2_x86inc"; |
add_proto qw/void vp9_quantize_fp/, "const int16_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, int16_t *qcoeff_ptr, int16_t *dqcoeff_ptr, const int16_t *dequant_ptr, int zbin_oq_value, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan"; |
-specialize qw/vp9_quantize_fp/, "$ssse3_x86_64"; |
+specialize qw/vp9_quantize_fp neon/, "$ssse3_x86_64"; |
add_proto qw/void vp9_quantize_fp_32x32/, "const int16_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, int16_t *qcoeff_ptr, int16_t *dqcoeff_ptr, const int16_t *dequant_ptr, int zbin_oq_value, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan"; |
specialize qw/vp9_quantize_fp_32x32/, "$ssse3_x86_64"; |
@@ -739,10 +739,10 @@ |
# fdct functions |
add_proto qw/void vp9_fht4x4/, "const int16_t *input, int16_t *output, int stride, int tx_type"; |
-specialize qw/vp9_fht4x4 sse2 avx2/; |
+specialize qw/vp9_fht4x4 sse2/; |
add_proto qw/void vp9_fht8x8/, "const int16_t *input, int16_t *output, int stride, int tx_type"; |
-specialize qw/vp9_fht8x8 sse2 avx2/; |
+specialize qw/vp9_fht8x8 sse2/; |
add_proto qw/void vp9_fht16x16/, "const int16_t *input, int16_t *output, int stride, int tx_type"; |
specialize qw/vp9_fht16x16 sse2/; |
@@ -754,13 +754,13 @@ |
specialize qw/vp9_fdct4x4_1 sse2/; |
add_proto qw/void vp9_fdct4x4/, "const int16_t *input, int16_t *output, int stride"; |
-specialize qw/vp9_fdct4x4 sse2 avx2/; |
+specialize qw/vp9_fdct4x4 sse2/; |
add_proto qw/void vp9_fdct8x8_1/, "const int16_t *input, int16_t *output, int stride"; |
-specialize qw/vp9_fdct8x8_1 sse2/; |
+specialize qw/vp9_fdct8x8_1 sse2 neon/; |
add_proto qw/void vp9_fdct8x8/, "const int16_t *input, int16_t *output, int stride"; |
-specialize qw/vp9_fdct8x8 sse2 avx2/, "$ssse3_x86_64"; |
+specialize qw/vp9_fdct8x8 sse2 neon/, "$ssse3_x86_64"; |
add_proto qw/void vp9_fdct16x16_1/, "const int16_t *input, int16_t *output, int stride"; |
specialize qw/vp9_fdct16x16_1 sse2/; |