| Index: source/config/mac/ia32/vp9_rtcd.h
|
| diff --git a/source/config/mac/ia32/vp9_rtcd.h b/source/config/mac/ia32/vp9_rtcd.h
|
| index 77d122a069582723543b99bab2a958c0ead13149..3559cf6ec1742de487853d290ccccafe3cab52c1 100644
|
| --- a/source/config/mac/ia32/vp9_rtcd.h
|
| +++ b/source/config/mac/ia32/vp9_rtcd.h
|
| @@ -38,11 +38,13 @@ unsigned int vp9_avg_8x8_sse2(const uint8_t *, int p);
|
| RTCD_EXTERN unsigned int (*vp9_avg_8x8)(const uint8_t *, int p);
|
|
|
| int64_t vp9_block_error_c(const tran_low_t *coeff, const tran_low_t *dqcoeff, intptr_t block_size, int64_t *ssz);
|
| -#define vp9_block_error vp9_block_error_c
|
| +int64_t vp9_block_error_avx2(const tran_low_t *coeff, const tran_low_t *dqcoeff, intptr_t block_size, int64_t *ssz);
|
| +RTCD_EXTERN int64_t (*vp9_block_error)(const tran_low_t *coeff, const tran_low_t *dqcoeff, intptr_t block_size, int64_t *ssz);
|
|
|
| void vp9_convolve8_c(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| void vp9_convolve8_sse2(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| void vp9_convolve8_ssse3(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| +void vp9_convolve8_avx2(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| RTCD_EXTERN void (*vp9_convolve8)(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
|
|
| void vp9_convolve8_avg_c(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| @@ -63,11 +65,13 @@ RTCD_EXTERN void (*vp9_convolve8_avg_vert)(const uint8_t *src, ptrdiff_t src_str
|
| void vp9_convolve8_horiz_c(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| void vp9_convolve8_horiz_sse2(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| void vp9_convolve8_horiz_ssse3(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| +void vp9_convolve8_horiz_avx2(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| RTCD_EXTERN void (*vp9_convolve8_horiz)(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
|
|
| void vp9_convolve8_vert_c(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| void vp9_convolve8_vert_sse2(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| void vp9_convolve8_vert_ssse3(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| +void vp9_convolve8_vert_avx2(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| RTCD_EXTERN void (*vp9_convolve8_vert)(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
|
|
| void vp9_convolve_avg_c(const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h);
|
| @@ -213,6 +217,7 @@ RTCD_EXTERN void (*vp9_fdct16x16_1)(const int16_t *input, tran_low_t *output, in
|
|
|
| void vp9_fdct32x32_c(const int16_t *input, tran_low_t *output, int stride);
|
| void vp9_fdct32x32_sse2(const int16_t *input, tran_low_t *output, int stride);
|
| +void vp9_fdct32x32_avx2(const int16_t *input, tran_low_t *output, int stride);
|
| RTCD_EXTERN void (*vp9_fdct32x32)(const int16_t *input, tran_low_t *output, int stride);
|
|
|
| void vp9_fdct32x32_1_c(const int16_t *input, tran_low_t *output, int stride);
|
| @@ -221,6 +226,7 @@ RTCD_EXTERN void (*vp9_fdct32x32_1)(const int16_t *input, tran_low_t *output, in
|
|
|
| void vp9_fdct32x32_rd_c(const int16_t *input, tran_low_t *output, int stride);
|
| void vp9_fdct32x32_rd_sse2(const int16_t *input, tran_low_t *output, int stride);
|
| +void vp9_fdct32x32_rd_avx2(const int16_t *input, tran_low_t *output, int stride);
|
| RTCD_EXTERN void (*vp9_fdct32x32_rd)(const int16_t *input, tran_low_t *output, int stride);
|
|
|
| void vp9_fdct4x4_c(const int16_t *input, tran_low_t *output, int stride);
|
| @@ -268,7 +274,8 @@ void vp9_fwht4x4_c(const int16_t *input, tran_low_t *output, int stride);
|
| #define vp9_fwht4x4 vp9_fwht4x4_c
|
|
|
| void vp9_get16x16var_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, int *sum);
|
| -#define vp9_get16x16var vp9_get16x16var_c
|
| +void vp9_get16x16var_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, int *sum);
|
| +RTCD_EXTERN void (*vp9_get16x16var)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, int *sum);
|
|
|
| void vp9_get8x8var_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, int *sum);
|
| #define vp9_get8x8var vp9_get8x8var_c
|
| @@ -354,6 +361,7 @@ void vp9_iwht4x4_1_add_c(const tran_low_t *input, uint8_t *dest, int dest_stride
|
|
|
| void vp9_lpf_horizontal_16_c(uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count);
|
| void vp9_lpf_horizontal_16_sse2(uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count);
|
| +void vp9_lpf_horizontal_16_avx2(uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count);
|
| RTCD_EXTERN void (*vp9_lpf_horizontal_16)(uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count);
|
|
|
| void vp9_lpf_horizontal_4_c(uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count);
|
| @@ -397,7 +405,8 @@ void vp9_lpf_vertical_8_dual_sse2(uint8_t *s, int pitch, const uint8_t *blimit0,
|
| RTCD_EXTERN void (*vp9_lpf_vertical_8_dual)(uint8_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1);
|
|
|
| unsigned int vp9_mse16x16_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int recon_stride, unsigned int *sse);
|
| -#define vp9_mse16x16 vp9_mse16x16_c
|
| +unsigned int vp9_mse16x16_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int recon_stride, unsigned int *sse);
|
| +RTCD_EXTERN unsigned int (*vp9_mse16x16)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int recon_stride, unsigned int *sse);
|
|
|
| unsigned int vp9_mse16x8_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int recon_stride, unsigned int *sse);
|
| #define vp9_mse16x8 vp9_mse16x8_c
|
| @@ -469,36 +478,43 @@ void vp9_sad16x8x8_c(const uint8_t *src_ptr, int src_stride, const uint8_t *ref
|
| #define vp9_sad16x8x8 vp9_sad16x8x8_c
|
|
|
| unsigned int vp9_sad32x16_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
| -#define vp9_sad32x16 vp9_sad32x16_c
|
| +unsigned int vp9_sad32x16_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
| +RTCD_EXTERN unsigned int (*vp9_sad32x16)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
|
|
| unsigned int vp9_sad32x16_avg_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
| -#define vp9_sad32x16_avg vp9_sad32x16_avg_c
|
| +unsigned int vp9_sad32x16_avg_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
| +RTCD_EXTERN unsigned int (*vp9_sad32x16_avg)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
|
|
| void vp9_sad32x16x4d_c(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| void vp9_sad32x16x4d_sse2(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| RTCD_EXTERN void (*vp9_sad32x16x4d)(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
|
|
| unsigned int vp9_sad32x32_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
| -#define vp9_sad32x32 vp9_sad32x32_c
|
| +unsigned int vp9_sad32x32_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
| +RTCD_EXTERN unsigned int (*vp9_sad32x32)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
|
|
| unsigned int vp9_sad32x32_avg_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
| -#define vp9_sad32x32_avg vp9_sad32x32_avg_c
|
| +unsigned int vp9_sad32x32_avg_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
| +RTCD_EXTERN unsigned int (*vp9_sad32x32_avg)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
|
|
| void vp9_sad32x32x3_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sad_array);
|
| #define vp9_sad32x32x3 vp9_sad32x32x3_c
|
|
|
| void vp9_sad32x32x4d_c(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| void vp9_sad32x32x4d_sse2(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| +void vp9_sad32x32x4d_avx2(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| RTCD_EXTERN void (*vp9_sad32x32x4d)(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
|
|
| void vp9_sad32x32x8_c(const uint8_t *src_ptr, int src_stride, const uint8_t *ref_ptr, int ref_stride, uint32_t *sad_array);
|
| #define vp9_sad32x32x8 vp9_sad32x32x8_c
|
|
|
| unsigned int vp9_sad32x64_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
| -#define vp9_sad32x64 vp9_sad32x64_c
|
| +unsigned int vp9_sad32x64_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
| +RTCD_EXTERN unsigned int (*vp9_sad32x64)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
|
|
| unsigned int vp9_sad32x64_avg_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
| -#define vp9_sad32x64_avg vp9_sad32x64_avg_c
|
| +unsigned int vp9_sad32x64_avg_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
| +RTCD_EXTERN unsigned int (*vp9_sad32x64_avg)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
|
|
| void vp9_sad32x64x4d_c(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| void vp9_sad32x64x4d_sse2(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| @@ -535,26 +551,31 @@ void vp9_sad4x8x8_c(const uint8_t *src_ptr, int src_stride, const uint8_t *ref_p
|
| #define vp9_sad4x8x8 vp9_sad4x8x8_c
|
|
|
| unsigned int vp9_sad64x32_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
| -#define vp9_sad64x32 vp9_sad64x32_c
|
| +unsigned int vp9_sad64x32_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
| +RTCD_EXTERN unsigned int (*vp9_sad64x32)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
|
|
| unsigned int vp9_sad64x32_avg_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
| -#define vp9_sad64x32_avg vp9_sad64x32_avg_c
|
| +unsigned int vp9_sad64x32_avg_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
| +RTCD_EXTERN unsigned int (*vp9_sad64x32_avg)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
|
|
| void vp9_sad64x32x4d_c(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| void vp9_sad64x32x4d_sse2(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| RTCD_EXTERN void (*vp9_sad64x32x4d)(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
|
|
| unsigned int vp9_sad64x64_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
| -#define vp9_sad64x64 vp9_sad64x64_c
|
| +unsigned int vp9_sad64x64_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
| +RTCD_EXTERN unsigned int (*vp9_sad64x64)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride);
|
|
|
| unsigned int vp9_sad64x64_avg_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
| -#define vp9_sad64x64_avg vp9_sad64x64_avg_c
|
| +unsigned int vp9_sad64x64_avg_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
| +RTCD_EXTERN unsigned int (*vp9_sad64x64_avg)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, const uint8_t *second_pred);
|
|
|
| void vp9_sad64x64x3_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sad_array);
|
| #define vp9_sad64x64x3 vp9_sad64x64x3_c
|
|
|
| void vp9_sad64x64x4d_c(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| void vp9_sad64x64x4d_sse2(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| +void vp9_sad64x64x4d_avx2(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| RTCD_EXTERN void (*vp9_sad64x64x4d)(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
|
|
| void vp9_sad64x64x8_c(const uint8_t *src_ptr, int src_stride, const uint8_t *ref_ptr, int ref_stride, uint32_t *sad_array);
|
| @@ -620,7 +641,8 @@ unsigned int vp9_sub_pixel_avg_variance32x16_c(const uint8_t *src_ptr, int sourc
|
| #define vp9_sub_pixel_avg_variance32x16 vp9_sub_pixel_avg_variance32x16_c
|
|
|
| unsigned int vp9_sub_pixel_avg_variance32x32_c(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred);
|
| -#define vp9_sub_pixel_avg_variance32x32 vp9_sub_pixel_avg_variance32x32_c
|
| +unsigned int vp9_sub_pixel_avg_variance32x32_avx2(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred);
|
| +RTCD_EXTERN unsigned int (*vp9_sub_pixel_avg_variance32x32)(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred);
|
|
|
| unsigned int vp9_sub_pixel_avg_variance32x64_c(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred);
|
| #define vp9_sub_pixel_avg_variance32x64 vp9_sub_pixel_avg_variance32x64_c
|
| @@ -635,7 +657,8 @@ unsigned int vp9_sub_pixel_avg_variance64x32_c(const uint8_t *src_ptr, int sourc
|
| #define vp9_sub_pixel_avg_variance64x32 vp9_sub_pixel_avg_variance64x32_c
|
|
|
| unsigned int vp9_sub_pixel_avg_variance64x64_c(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred);
|
| -#define vp9_sub_pixel_avg_variance64x64 vp9_sub_pixel_avg_variance64x64_c
|
| +unsigned int vp9_sub_pixel_avg_variance64x64_avx2(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred);
|
| +RTCD_EXTERN unsigned int (*vp9_sub_pixel_avg_variance64x64)(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred);
|
|
|
| unsigned int vp9_sub_pixel_avg_variance8x16_c(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred);
|
| #define vp9_sub_pixel_avg_variance8x16 vp9_sub_pixel_avg_variance8x16_c
|
| @@ -659,7 +682,8 @@ unsigned int vp9_sub_pixel_variance32x16_c(const uint8_t *src_ptr, int source_st
|
| #define vp9_sub_pixel_variance32x16 vp9_sub_pixel_variance32x16_c
|
|
|
| unsigned int vp9_sub_pixel_variance32x32_c(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| -#define vp9_sub_pixel_variance32x32 vp9_sub_pixel_variance32x32_c
|
| +unsigned int vp9_sub_pixel_variance32x32_avx2(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| +RTCD_EXTERN unsigned int (*vp9_sub_pixel_variance32x32)(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
|
|
| unsigned int vp9_sub_pixel_variance32x64_c(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| #define vp9_sub_pixel_variance32x64 vp9_sub_pixel_variance32x64_c
|
| @@ -674,7 +698,8 @@ unsigned int vp9_sub_pixel_variance64x32_c(const uint8_t *src_ptr, int source_st
|
| #define vp9_sub_pixel_variance64x32 vp9_sub_pixel_variance64x32_c
|
|
|
| unsigned int vp9_sub_pixel_variance64x64_c(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| -#define vp9_sub_pixel_variance64x64 vp9_sub_pixel_variance64x64_c
|
| +unsigned int vp9_sub_pixel_variance64x64_avx2(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| +RTCD_EXTERN unsigned int (*vp9_sub_pixel_variance64x64)(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
|
|
| unsigned int vp9_sub_pixel_variance8x16_c(const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| #define vp9_sub_pixel_variance8x16 vp9_sub_pixel_variance8x16_c
|
| @@ -717,7 +742,8 @@ void vp9_v_predictor_8x8_c(uint8_t *dst, ptrdiff_t y_stride, const uint8_t *abov
|
| #define vp9_v_predictor_8x8 vp9_v_predictor_8x8_c
|
|
|
| unsigned int vp9_variance16x16_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| -#define vp9_variance16x16 vp9_variance16x16_c
|
| +unsigned int vp9_variance16x16_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| +RTCD_EXTERN unsigned int (*vp9_variance16x16)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
|
|
| unsigned int vp9_variance16x32_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| #define vp9_variance16x32 vp9_variance16x32_c
|
| @@ -726,10 +752,12 @@ unsigned int vp9_variance16x8_c(const uint8_t *src_ptr, int source_stride, const
|
| #define vp9_variance16x8 vp9_variance16x8_c
|
|
|
| unsigned int vp9_variance32x16_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| -#define vp9_variance32x16 vp9_variance32x16_c
|
| +unsigned int vp9_variance32x16_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| +RTCD_EXTERN unsigned int (*vp9_variance32x16)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
|
|
| unsigned int vp9_variance32x32_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| -#define vp9_variance32x32 vp9_variance32x32_c
|
| +unsigned int vp9_variance32x32_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| +RTCD_EXTERN unsigned int (*vp9_variance32x32)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
|
|
| unsigned int vp9_variance32x64_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| #define vp9_variance32x64 vp9_variance32x64_c
|
| @@ -741,10 +769,12 @@ unsigned int vp9_variance4x8_c(const uint8_t *src_ptr, int source_stride, const
|
| #define vp9_variance4x8 vp9_variance4x8_c
|
|
|
| unsigned int vp9_variance64x32_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| -#define vp9_variance64x32 vp9_variance64x32_c
|
| +unsigned int vp9_variance64x32_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| +RTCD_EXTERN unsigned int (*vp9_variance64x32)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
|
|
| unsigned int vp9_variance64x64_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| -#define vp9_variance64x64 vp9_variance64x64_c
|
| +unsigned int vp9_variance64x64_avx2(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| +RTCD_EXTERN unsigned int (*vp9_variance64x64)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
|
|
| unsigned int vp9_variance8x16_c(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| #define vp9_variance8x16 vp9_variance8x16_c
|
| @@ -769,9 +799,12 @@ static void setup_rtcd_internal(void)
|
| if (flags & HAS_SSE2) vp9_avg_4x4 = vp9_avg_4x4_sse2;
|
| vp9_avg_8x8 = vp9_avg_8x8_c;
|
| if (flags & HAS_SSE2) vp9_avg_8x8 = vp9_avg_8x8_sse2;
|
| + vp9_block_error = vp9_block_error_c;
|
| + if (flags & HAS_AVX2) vp9_block_error = vp9_block_error_avx2;
|
| vp9_convolve8 = vp9_convolve8_c;
|
| if (flags & HAS_SSE2) vp9_convolve8 = vp9_convolve8_sse2;
|
| if (flags & HAS_SSSE3) vp9_convolve8 = vp9_convolve8_ssse3;
|
| + if (flags & HAS_AVX2) vp9_convolve8 = vp9_convolve8_avx2;
|
| vp9_convolve8_avg = vp9_convolve8_avg_c;
|
| if (flags & HAS_SSE2) vp9_convolve8_avg = vp9_convolve8_avg_sse2;
|
| if (flags & HAS_SSSE3) vp9_convolve8_avg = vp9_convolve8_avg_ssse3;
|
| @@ -784,9 +817,11 @@ static void setup_rtcd_internal(void)
|
| vp9_convolve8_horiz = vp9_convolve8_horiz_c;
|
| if (flags & HAS_SSE2) vp9_convolve8_horiz = vp9_convolve8_horiz_sse2;
|
| if (flags & HAS_SSSE3) vp9_convolve8_horiz = vp9_convolve8_horiz_ssse3;
|
| + if (flags & HAS_AVX2) vp9_convolve8_horiz = vp9_convolve8_horiz_avx2;
|
| vp9_convolve8_vert = vp9_convolve8_vert_c;
|
| if (flags & HAS_SSE2) vp9_convolve8_vert = vp9_convolve8_vert_sse2;
|
| if (flags & HAS_SSSE3) vp9_convolve8_vert = vp9_convolve8_vert_ssse3;
|
| + if (flags & HAS_AVX2) vp9_convolve8_vert = vp9_convolve8_vert_avx2;
|
| vp9_denoiser_filter = vp9_denoiser_filter_c;
|
| if (flags & HAS_SSE2) vp9_denoiser_filter = vp9_denoiser_filter_sse2;
|
| vp9_fdct16x16 = vp9_fdct16x16_c;
|
| @@ -795,10 +830,12 @@ static void setup_rtcd_internal(void)
|
| if (flags & HAS_SSE2) vp9_fdct16x16_1 = vp9_fdct16x16_1_sse2;
|
| vp9_fdct32x32 = vp9_fdct32x32_c;
|
| if (flags & HAS_SSE2) vp9_fdct32x32 = vp9_fdct32x32_sse2;
|
| + if (flags & HAS_AVX2) vp9_fdct32x32 = vp9_fdct32x32_avx2;
|
| vp9_fdct32x32_1 = vp9_fdct32x32_1_c;
|
| if (flags & HAS_SSE2) vp9_fdct32x32_1 = vp9_fdct32x32_1_sse2;
|
| vp9_fdct32x32_rd = vp9_fdct32x32_rd_c;
|
| if (flags & HAS_SSE2) vp9_fdct32x32_rd = vp9_fdct32x32_rd_sse2;
|
| + if (flags & HAS_AVX2) vp9_fdct32x32_rd = vp9_fdct32x32_rd_avx2;
|
| vp9_fdct4x4 = vp9_fdct4x4_c;
|
| if (flags & HAS_SSE2) vp9_fdct4x4 = vp9_fdct4x4_sse2;
|
| vp9_fdct4x4_1 = vp9_fdct4x4_1_c;
|
| @@ -819,6 +856,8 @@ static void setup_rtcd_internal(void)
|
| vp9_full_search_sad = vp9_full_search_sad_c;
|
| if (flags & HAS_SSE3) vp9_full_search_sad = vp9_full_search_sadx3;
|
| if (flags & HAS_SSE4_1) vp9_full_search_sad = vp9_full_search_sadx8;
|
| + vp9_get16x16var = vp9_get16x16var_c;
|
| + if (flags & HAS_AVX2) vp9_get16x16var = vp9_get16x16var_avx2;
|
| vp9_idct16x16_10_add = vp9_idct16x16_10_add_c;
|
| if (flags & HAS_SSE2) vp9_idct16x16_10_add = vp9_idct16x16_10_add_sse2;
|
| if (flags & HAS_SSSE3) vp9_idct16x16_10_add = vp9_idct16x16_10_add_ssse3;
|
| @@ -851,6 +890,7 @@ static void setup_rtcd_internal(void)
|
| if (flags & HAS_SSE2) vp9_iht8x8_64_add = vp9_iht8x8_64_add_sse2;
|
| vp9_lpf_horizontal_16 = vp9_lpf_horizontal_16_c;
|
| if (flags & HAS_SSE2) vp9_lpf_horizontal_16 = vp9_lpf_horizontal_16_sse2;
|
| + if (flags & HAS_AVX2) vp9_lpf_horizontal_16 = vp9_lpf_horizontal_16_avx2;
|
| vp9_lpf_horizontal_4 = vp9_lpf_horizontal_4_c;
|
| if (flags & HAS_MMX) vp9_lpf_horizontal_4 = vp9_lpf_horizontal_4_mmx;
|
| vp9_lpf_horizontal_4_dual = vp9_lpf_horizontal_4_dual_c;
|
| @@ -871,6 +911,8 @@ static void setup_rtcd_internal(void)
|
| if (flags & HAS_SSE2) vp9_lpf_vertical_8 = vp9_lpf_vertical_8_sse2;
|
| vp9_lpf_vertical_8_dual = vp9_lpf_vertical_8_dual_c;
|
| if (flags & HAS_SSE2) vp9_lpf_vertical_8_dual = vp9_lpf_vertical_8_dual_sse2;
|
| + vp9_mse16x16 = vp9_mse16x16_c;
|
| + if (flags & HAS_AVX2) vp9_mse16x16 = vp9_mse16x16_avx2;
|
| vp9_quantize_b = vp9_quantize_b_c;
|
| if (flags & HAS_SSE2) vp9_quantize_b = vp9_quantize_b_sse2;
|
| vp9_quantize_fp = vp9_quantize_fp_c;
|
| @@ -887,10 +929,23 @@ static void setup_rtcd_internal(void)
|
| if (flags & HAS_SSSE3) vp9_sad16x8x3 = vp9_sad16x8x3_ssse3;
|
| vp9_sad16x8x4d = vp9_sad16x8x4d_c;
|
| if (flags & HAS_SSE2) vp9_sad16x8x4d = vp9_sad16x8x4d_sse2;
|
| + vp9_sad32x16 = vp9_sad32x16_c;
|
| + if (flags & HAS_AVX2) vp9_sad32x16 = vp9_sad32x16_avx2;
|
| + vp9_sad32x16_avg = vp9_sad32x16_avg_c;
|
| + if (flags & HAS_AVX2) vp9_sad32x16_avg = vp9_sad32x16_avg_avx2;
|
| vp9_sad32x16x4d = vp9_sad32x16x4d_c;
|
| if (flags & HAS_SSE2) vp9_sad32x16x4d = vp9_sad32x16x4d_sse2;
|
| + vp9_sad32x32 = vp9_sad32x32_c;
|
| + if (flags & HAS_AVX2) vp9_sad32x32 = vp9_sad32x32_avx2;
|
| + vp9_sad32x32_avg = vp9_sad32x32_avg_c;
|
| + if (flags & HAS_AVX2) vp9_sad32x32_avg = vp9_sad32x32_avg_avx2;
|
| vp9_sad32x32x4d = vp9_sad32x32x4d_c;
|
| if (flags & HAS_SSE2) vp9_sad32x32x4d = vp9_sad32x32x4d_sse2;
|
| + if (flags & HAS_AVX2) vp9_sad32x32x4d = vp9_sad32x32x4d_avx2;
|
| + vp9_sad32x64 = vp9_sad32x64_c;
|
| + if (flags & HAS_AVX2) vp9_sad32x64 = vp9_sad32x64_avx2;
|
| + vp9_sad32x64_avg = vp9_sad32x64_avg_c;
|
| + if (flags & HAS_AVX2) vp9_sad32x64_avg = vp9_sad32x64_avg_avx2;
|
| vp9_sad32x64x4d = vp9_sad32x64x4d_c;
|
| if (flags & HAS_SSE2) vp9_sad32x64x4d = vp9_sad32x64x4d_sse2;
|
| vp9_sad4x4x3 = vp9_sad4x4x3_c;
|
| @@ -899,10 +954,19 @@ static void setup_rtcd_internal(void)
|
| if (flags & HAS_SSE) vp9_sad4x4x4d = vp9_sad4x4x4d_sse;
|
| vp9_sad4x8x4d = vp9_sad4x8x4d_c;
|
| if (flags & HAS_SSE) vp9_sad4x8x4d = vp9_sad4x8x4d_sse;
|
| + vp9_sad64x32 = vp9_sad64x32_c;
|
| + if (flags & HAS_AVX2) vp9_sad64x32 = vp9_sad64x32_avx2;
|
| + vp9_sad64x32_avg = vp9_sad64x32_avg_c;
|
| + if (flags & HAS_AVX2) vp9_sad64x32_avg = vp9_sad64x32_avg_avx2;
|
| vp9_sad64x32x4d = vp9_sad64x32x4d_c;
|
| if (flags & HAS_SSE2) vp9_sad64x32x4d = vp9_sad64x32x4d_sse2;
|
| + vp9_sad64x64 = vp9_sad64x64_c;
|
| + if (flags & HAS_AVX2) vp9_sad64x64 = vp9_sad64x64_avx2;
|
| + vp9_sad64x64_avg = vp9_sad64x64_avg_c;
|
| + if (flags & HAS_AVX2) vp9_sad64x64_avg = vp9_sad64x64_avg_avx2;
|
| vp9_sad64x64x4d = vp9_sad64x64x4d_c;
|
| if (flags & HAS_SSE2) vp9_sad64x64x4d = vp9_sad64x64x4d_sse2;
|
| + if (flags & HAS_AVX2) vp9_sad64x64x4d = vp9_sad64x64x4d_avx2;
|
| vp9_sad8x16x3 = vp9_sad8x16x3_c;
|
| if (flags & HAS_SSE3) vp9_sad8x16x3 = vp9_sad8x16x3_sse3;
|
| vp9_sad8x16x4d = vp9_sad8x16x4d_c;
|
| @@ -913,8 +977,26 @@ static void setup_rtcd_internal(void)
|
| if (flags & HAS_SSE3) vp9_sad8x8x3 = vp9_sad8x8x3_sse3;
|
| vp9_sad8x8x4d = vp9_sad8x8x4d_c;
|
| if (flags & HAS_SSE2) vp9_sad8x8x4d = vp9_sad8x8x4d_sse2;
|
| + vp9_sub_pixel_avg_variance32x32 = vp9_sub_pixel_avg_variance32x32_c;
|
| + if (flags & HAS_AVX2) vp9_sub_pixel_avg_variance32x32 = vp9_sub_pixel_avg_variance32x32_avx2;
|
| + vp9_sub_pixel_avg_variance64x64 = vp9_sub_pixel_avg_variance64x64_c;
|
| + if (flags & HAS_AVX2) vp9_sub_pixel_avg_variance64x64 = vp9_sub_pixel_avg_variance64x64_avx2;
|
| + vp9_sub_pixel_variance32x32 = vp9_sub_pixel_variance32x32_c;
|
| + if (flags & HAS_AVX2) vp9_sub_pixel_variance32x32 = vp9_sub_pixel_variance32x32_avx2;
|
| + vp9_sub_pixel_variance64x64 = vp9_sub_pixel_variance64x64_c;
|
| + if (flags & HAS_AVX2) vp9_sub_pixel_variance64x64 = vp9_sub_pixel_variance64x64_avx2;
|
| vp9_temporal_filter_apply = vp9_temporal_filter_apply_c;
|
| if (flags & HAS_SSE2) vp9_temporal_filter_apply = vp9_temporal_filter_apply_sse2;
|
| + vp9_variance16x16 = vp9_variance16x16_c;
|
| + if (flags & HAS_AVX2) vp9_variance16x16 = vp9_variance16x16_avx2;
|
| + vp9_variance32x16 = vp9_variance32x16_c;
|
| + if (flags & HAS_AVX2) vp9_variance32x16 = vp9_variance32x16_avx2;
|
| + vp9_variance32x32 = vp9_variance32x32_c;
|
| + if (flags & HAS_AVX2) vp9_variance32x32 = vp9_variance32x32_avx2;
|
| + vp9_variance64x32 = vp9_variance64x32_c;
|
| + if (flags & HAS_AVX2) vp9_variance64x32 = vp9_variance64x32_avx2;
|
| + vp9_variance64x64 = vp9_variance64x64_c;
|
| + if (flags & HAS_AVX2) vp9_variance64x64 = vp9_variance64x64_avx2;
|
| }
|
| #endif
|
|
|
|
|