| Index: source/config/linux/arm-neon-cpu-detect/vp9_rtcd.h
|
| diff --git a/source/config/linux/arm-neon-cpu-detect/vp9_rtcd.h b/source/config/linux/arm-neon-cpu-detect/vp9_rtcd.h
|
| index 1ae87d1eba9bc09373a7b47fe4899ee1dfe000f0..56bbd99521332db46a07bfbcc44aabfd4964c808 100644
|
| --- a/source/config/linux/arm-neon-cpu-detect/vp9_rtcd.h
|
| +++ b/source/config/linux/arm-neon-cpu-detect/vp9_rtcd.h
|
| @@ -33,7 +33,8 @@ unsigned int vp9_avg_4x4_c(const uint8_t *, int p);
|
| #define vp9_avg_4x4 vp9_avg_4x4_c
|
|
|
| unsigned int vp9_avg_8x8_c(const uint8_t *, int p);
|
| -#define vp9_avg_8x8 vp9_avg_8x8_c
|
| +unsigned int vp9_avg_8x8_neon(const uint8_t *, int p);
|
| +RTCD_EXTERN unsigned int (*vp9_avg_8x8)(const uint8_t *, int p);
|
|
|
| int64_t vp9_block_error_c(const tran_low_t *coeff, const tran_low_t *dqcoeff, intptr_t block_size, int64_t *ssz);
|
| #define vp9_block_error vp9_block_error_c
|
| @@ -226,7 +227,8 @@ void vp9_fdct8x8_1_neon(const int16_t *input, tran_low_t *output, int stride);
|
| RTCD_EXTERN void (*vp9_fdct8x8_1)(const int16_t *input, tran_low_t *output, int stride);
|
|
|
| void vp9_fdct8x8_quant_c(const int16_t *input, int stride, tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan);
|
| -#define vp9_fdct8x8_quant vp9_fdct8x8_quant_c
|
| +void vp9_fdct8x8_quant_neon(const int16_t *input, int stride, tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan);
|
| +RTCD_EXTERN void (*vp9_fdct8x8_quant)(const int16_t *input, int stride, tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan);
|
|
|
| void vp9_fht16x16_c(const int16_t *input, tran_low_t *output, int stride, int tx_type);
|
| #define vp9_fht16x16 vp9_fht16x16_c
|
| @@ -328,6 +330,12 @@ void vp9_iht8x8_64_add_c(const tran_low_t *input, uint8_t *dest, int dest_stride
|
| void vp9_iht8x8_64_add_neon(const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type);
|
| RTCD_EXTERN void (*vp9_iht8x8_64_add)(const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type);
|
|
|
| +int16_t vp9_int_pro_col_c(uint8_t const *ref, const int width);
|
| +#define vp9_int_pro_col vp9_int_pro_col_c
|
| +
|
| +void vp9_int_pro_row_c(int16_t *hbuf, uint8_t const *ref, const int ref_stride, const int height);
|
| +#define vp9_int_pro_row vp9_int_pro_row_c
|
| +
|
| void vp9_iwht4x4_16_add_c(const tran_low_t *input, uint8_t *dest, int dest_stride);
|
| #define vp9_iwht4x4_16_add vp9_iwht4x4_16_add_c
|
|
|
| @@ -414,7 +422,8 @@ void vp9_sad16x16x3_c(const uint8_t *src_ptr, int source_stride, const uint8_t *
|
| #define vp9_sad16x16x3 vp9_sad16x16x3_c
|
|
|
| void vp9_sad16x16x4d_c(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| -#define vp9_sad16x16x4d vp9_sad16x16x4d_c
|
| +void vp9_sad16x16x4d_neon(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| +RTCD_EXTERN void (*vp9_sad16x16x4d)(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
|
|
| void vp9_sad16x16x8_c(const uint8_t *src_ptr, int src_stride, const uint8_t *ref_ptr, int ref_stride, uint32_t *sad_array);
|
| #define vp9_sad16x16x8 vp9_sad16x16x8_c
|
| @@ -463,7 +472,8 @@ void vp9_sad32x32x3_c(const uint8_t *src_ptr, int source_stride, const uint8_t *
|
| #define vp9_sad32x32x3 vp9_sad32x32x3_c
|
|
|
| void vp9_sad32x32x4d_c(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| -#define vp9_sad32x32x4d vp9_sad32x32x4d_c
|
| +void vp9_sad32x32x4d_neon(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| +RTCD_EXTERN void (*vp9_sad32x32x4d)(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
|
|
| void vp9_sad32x32x8_c(const uint8_t *src_ptr, int src_stride, const uint8_t *ref_ptr, int ref_stride, uint32_t *sad_array);
|
| #define vp9_sad32x32x8 vp9_sad32x32x8_c
|
| @@ -524,7 +534,8 @@ void vp9_sad64x64x3_c(const uint8_t *src_ptr, int source_stride, const uint8_t *
|
| #define vp9_sad64x64x3 vp9_sad64x64x3_c
|
|
|
| void vp9_sad64x64x4d_c(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| -#define vp9_sad64x64x4d vp9_sad64x64x4d_c
|
| +void vp9_sad64x64x4d_neon(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
| +RTCD_EXTERN void (*vp9_sad64x64x4d)(const uint8_t *src_ptr, int src_stride, const uint8_t* const ref_ptr[], int ref_stride, unsigned int *sad_array);
|
|
|
| void vp9_sad64x64x8_c(const uint8_t *src_ptr, int src_stride, const uint8_t *ref_ptr, int ref_stride, uint32_t *sad_array);
|
| #define vp9_sad64x64x8 vp9_sad64x64x8_c
|
| @@ -738,6 +749,9 @@ unsigned int vp9_variance8x8_c(const uint8_t *src_ptr, int source_stride, const
|
| unsigned int vp9_variance8x8_neon(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
| RTCD_EXTERN unsigned int (*vp9_variance8x8)(const uint8_t *src_ptr, int source_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse);
|
|
|
| +int vp9_vector_sad_c(int16_t const *ref, int16_t const *src, const int width);
|
| +#define vp9_vector_sad vp9_vector_sad_c
|
| +
|
| void vp9_rtcd(void);
|
|
|
| #include "vpx_config.h"
|
| @@ -750,6 +764,8 @@ static void setup_rtcd_internal(void)
|
|
|
| (void)flags;
|
|
|
| + vp9_avg_8x8 = vp9_avg_8x8_c;
|
| + if (flags & HAS_NEON) vp9_avg_8x8 = vp9_avg_8x8_neon;
|
| vp9_convolve8 = vp9_convolve8_c;
|
| if (flags & HAS_NEON) vp9_convolve8 = vp9_convolve8_neon;
|
| vp9_convolve8_avg = vp9_convolve8_avg_c;
|
| @@ -770,6 +786,8 @@ static void setup_rtcd_internal(void)
|
| if (flags & HAS_NEON) vp9_fdct8x8 = vp9_fdct8x8_neon;
|
| vp9_fdct8x8_1 = vp9_fdct8x8_1_c;
|
| if (flags & HAS_NEON) vp9_fdct8x8_1 = vp9_fdct8x8_1_neon;
|
| + vp9_fdct8x8_quant = vp9_fdct8x8_quant_c;
|
| + if (flags & HAS_NEON) vp9_fdct8x8_quant = vp9_fdct8x8_quant_neon;
|
| vp9_get16x16var = vp9_get16x16var_c;
|
| if (flags & HAS_NEON) vp9_get16x16var = vp9_get16x16var_neon;
|
| vp9_get8x8var = vp9_get8x8var_c;
|
| @@ -834,10 +852,16 @@ static void setup_rtcd_internal(void)
|
| if (flags & HAS_NEON) vp9_quantize_fp = vp9_quantize_fp_neon;
|
| vp9_sad16x16 = vp9_sad16x16_c;
|
| if (flags & HAS_NEON) vp9_sad16x16 = vp9_sad16x16_neon;
|
| + vp9_sad16x16x4d = vp9_sad16x16x4d_c;
|
| + if (flags & HAS_NEON) vp9_sad16x16x4d = vp9_sad16x16x4d_neon;
|
| vp9_sad32x32 = vp9_sad32x32_c;
|
| if (flags & HAS_NEON) vp9_sad32x32 = vp9_sad32x32_neon;
|
| + vp9_sad32x32x4d = vp9_sad32x32x4d_c;
|
| + if (flags & HAS_NEON) vp9_sad32x32x4d = vp9_sad32x32x4d_neon;
|
| vp9_sad64x64 = vp9_sad64x64_c;
|
| if (flags & HAS_NEON) vp9_sad64x64 = vp9_sad64x64_neon;
|
| + vp9_sad64x64x4d = vp9_sad64x64x4d_c;
|
| + if (flags & HAS_NEON) vp9_sad64x64x4d = vp9_sad64x64x4d_neon;
|
| vp9_sad8x8 = vp9_sad8x8_c;
|
| if (flags & HAS_NEON) vp9_sad8x8 = vp9_sad8x8_neon;
|
| vp9_sub_pixel_variance16x16 = vp9_sub_pixel_variance16x16_c;
|
|
|