| OLD | NEW |
| (Empty) |
| 1 #ifndef VP9_RTCD_H_ | |
| 2 #define VP9_RTCD_H_ | |
| 3 | |
/*
 * RTCD_EXTERN is the storage-class prefix used on the function-pointer
 * declarations in this header. When RTCD_C is defined it expands to nothing,
 * so those declarations carry no `extern`; in every other translation unit
 * it expands to `extern`.
 */
| 4 #ifdef RTCD_C | |
| 5 #define RTCD_EXTERN | |
| 6 #else | |
| 7 #define RTCD_EXTERN extern | |
| 8 #endif | |
| 9 | |
| 10 /* | |
| 11 * VP9 | |
| 12 */ | |
| 13 | |
| 14 #include "vpx/vpx_integer.h" | |
| 15 #include "vp9/common/vp9_common.h" | |
| 16 #include "vp9/common/vp9_enums.h" | |
| 17 | |
| 18 struct macroblockd; | |
| 19 | |
| 20 /* Encoder forward decls */ | |
| 21 struct macroblock; | |
| 22 struct vp9_variance_vtable; | |
| 23 struct search_site_config; | |
| 24 struct mv; | |
| 25 union int_mv; | |
| 26 struct yv12_buffer_config; | |
| 27 | |
| 28 #ifdef __cplusplus | |
| 29 extern "C" { | |
| 30 #endif | |
| 31 | |
/*
 * vp9_block_error: three variants with one signature, reached through the
 * vp9_block_error function pointer. setup_rtcd_internal() sets the pointer
 * to the _sse2 variant and replaces it with _avx2 when HAS_AVX2 is reported.
 * The _c variant is declared but never selected in this header.
 */
| 32 int64_t vp9_block_error_c(const tran_low_t *coeff, const tran_low_t *dqcoeff, in
tptr_t block_size, int64_t *ssz); | |
| 33 int64_t vp9_block_error_sse2(const tran_low_t *coeff, const tran_low_t *dqcoeff,
intptr_t block_size, int64_t *ssz); | |
| 34 int64_t vp9_block_error_avx2(const tran_low_t *coeff, const tran_low_t *dqcoeff,
intptr_t block_size, int64_t *ssz); | |
| 35 RTCD_EXTERN int64_t (*vp9_block_error)(const tran_low_t *coeff, const tran_low_t
*dqcoeff, intptr_t block_size, int64_t *ssz); | |
| 36 | |
/*
 * vp9_block_error_fp is bound at compile time: the macro turns every use of
 * the name into a direct reference to vp9_block_error_fp_sse2. No runtime
 * CPU check is involved.
 */
| 37 int64_t vp9_block_error_fp_c(const int16_t *coeff, const int16_t *dqcoeff, int b
lock_size); | |
| 38 int64_t vp9_block_error_fp_sse2(const int16_t *coeff, const int16_t *dqcoeff, in
t block_size); | |
| 39 #define vp9_block_error_fp vp9_block_error_fp_sse2 | |
| 40 | |
/*
 * vp9_denoiser_filter is bound at compile time to the _sse2 variant through
 * the macro below; both variants take the same parameter list.
 */
| 41 int vp9_denoiser_filter_c(const uint8_t *sig, int sig_stride, const uint8_t *mc_
avg, int mc_avg_stride, uint8_t *avg, int avg_stride, int increase_denoising, BL
OCK_SIZE bs, int motion_magnitude); | |
| 42 int vp9_denoiser_filter_sse2(const uint8_t *sig, int sig_stride, const uint8_t *
mc_avg, int mc_avg_stride, uint8_t *avg, int avg_stride, int increase_denoising,
BLOCK_SIZE bs, int motion_magnitude); | |
| 43 #define vp9_denoiser_filter vp9_denoiser_filter_sse2 | |
| 44 | |
/*
 * vp9_diamond_search_sad: reached through a function pointer.
 * setup_rtcd_internal() starts from the _c variant and switches to the _avx
 * variant when HAS_AVX is reported.
 */
| 45 int vp9_diamond_search_sad_c(const struct macroblock *x, const struct search_sit
e_config *cfg, struct mv *ref_mv, struct mv *best_mv, int search_param, int sad
_per_bit, int *num00, const struct vp9_variance_vtable *fn_ptr, const struct mv
*center_mv); | |
| 46 int vp9_diamond_search_sad_avx(const struct macroblock *x, const struct search_s
ite_config *cfg, struct mv *ref_mv, struct mv *best_mv, int search_param, int s
ad_per_bit, int *num00, const struct vp9_variance_vtable *fn_ptr, const struct m
v *center_mv); | |
| 47 RTCD_EXTERN int (*vp9_diamond_search_sad)(const struct macroblock *x, const stru
ct search_site_config *cfg, struct mv *ref_mv, struct mv *best_mv, int search_p
aram, int sad_per_bit, int *num00, const struct vp9_variance_vtable *fn_ptr, con
st struct mv *center_mv); | |
| 48 | |
/*
 * vp9_fdct8x8_quant: reached through a function pointer.
 * setup_rtcd_internal() starts from the _sse2 variant and switches to _ssse3
 * when HAS_SSSE3 is reported. The _c variant is declared but never selected
 * in this header.
 */
| 49 void vp9_fdct8x8_quant_c(const int16_t *input, int stride, tran_low_t *coeff_ptr
, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *rou
nd_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qc
oeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr
, const int16_t *scan, const int16_t *iscan); | |
| 50 void vp9_fdct8x8_quant_sse2(const int16_t *input, int stride, tran_low_t *coeff_
ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *
round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t
*qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_
ptr, const int16_t *scan, const int16_t *iscan); | |
| 51 void vp9_fdct8x8_quant_ssse3(const int16_t *input, int stride, tran_low_t *coeff
_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t
*round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t
*qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob
_ptr, const int16_t *scan, const int16_t *iscan); | |
| 52 RTCD_EXTERN void (*vp9_fdct8x8_quant)(const int16_t *input, int stride, tran_low
_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const
int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, t
ran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint
16_t *eob_ptr, const int16_t *scan, const int16_t *iscan); | |
| 53 | |
/* vp9_fht16x16 is bound at compile time to the _sse2 variant via the macro. */
| 54 void vp9_fht16x16_c(const int16_t *input, tran_low_t *output, int stride, int tx
_type); | |
| 55 void vp9_fht16x16_sse2(const int16_t *input, tran_low_t *output, int stride, int
tx_type); | |
| 56 #define vp9_fht16x16 vp9_fht16x16_sse2 | |
| 57 | |
/* vp9_fht4x4 is bound at compile time to the _sse2 variant via the macro. */
| 58 void vp9_fht4x4_c(const int16_t *input, tran_low_t *output, int stride, int tx_t
ype); | |
| 59 void vp9_fht4x4_sse2(const int16_t *input, tran_low_t *output, int stride, int t
x_type); | |
| 60 #define vp9_fht4x4 vp9_fht4x4_sse2 | |
| 61 | |
/* vp9_fht8x8 is bound at compile time to the _sse2 variant via the macro. */
| 62 void vp9_fht8x8_c(const int16_t *input, tran_low_t *output, int stride, int tx_t
ype); | |
| 63 void vp9_fht8x8_sse2(const int16_t *input, tran_low_t *output, int stride, int t
x_type); | |
| 64 #define vp9_fht8x8 vp9_fht8x8_sse2 | |
| 65 | |
/*
 * vp9_filter_by_weight16x16 is bound at compile time to the _sse2 variant
 * via the macro.
 */
| 66 void vp9_filter_by_weight16x16_c(const uint8_t *src, int src_stride, uint8_t *ds
t, int dst_stride, int src_weight); | |
| 67 void vp9_filter_by_weight16x16_sse2(const uint8_t *src, int src_stride, uint8_t
*dst, int dst_stride, int src_weight); | |
| 68 #define vp9_filter_by_weight16x16 vp9_filter_by_weight16x16_sse2 | |
| 69 | |
/*
 * vp9_filter_by_weight8x8 is bound at compile time to the _sse2 variant
 * via the macro.
 */
| 70 void vp9_filter_by_weight8x8_c(const uint8_t *src, int src_stride, uint8_t *dst,
int dst_stride, int src_weight); | |
| 71 void vp9_filter_by_weight8x8_sse2(const uint8_t *src, int src_stride, uint8_t *d
st, int dst_stride, int src_weight); | |
| 72 #define vp9_filter_by_weight8x8 vp9_filter_by_weight8x8_sse2 | |
| 73 | |
/*
 * vp9_full_search_sad: reached through a function pointer.
 * setup_rtcd_internal() starts from the _c variant, switches to
 * vp9_full_search_sadx3 when HAS_SSE3 is reported, and then to
 * vp9_full_search_sadx8 when HAS_SSE4_1 is reported. The SSE4.1 check runs
 * last, so sadx8 wins when both bits are set.
 */
| 74 int vp9_full_search_sad_c(const struct macroblock *x, const struct mv *ref_mv, i
nt sad_per_bit, int distance, const struct vp9_variance_vtable *fn_ptr, const st
ruct mv *center_mv, struct mv *best_mv); | |
| 75 int vp9_full_search_sadx3(const struct macroblock *x, const struct mv *ref_mv, i
nt sad_per_bit, int distance, const struct vp9_variance_vtable *fn_ptr, const st
ruct mv *center_mv, struct mv *best_mv); | |
| 76 int vp9_full_search_sadx8(const struct macroblock *x, const struct mv *ref_mv, i
nt sad_per_bit, int distance, const struct vp9_variance_vtable *fn_ptr, const st
ruct mv *center_mv, struct mv *best_mv); | |
| 77 RTCD_EXTERN int (*vp9_full_search_sad)(const struct macroblock *x, const struct
mv *ref_mv, int sad_per_bit, int distance, const struct vp9_variance_vtable *fn_
ptr, const struct mv *center_mv, struct mv *best_mv); | |
| 78 | |
/* vp9_fwht4x4 is bound at compile time to the _mmx variant via the macro. */
| 79 void vp9_fwht4x4_c(const int16_t *input, tran_low_t *output, int stride); | |
| 80 void vp9_fwht4x4_mmx(const int16_t *input, tran_low_t *output, int stride); | |
| 81 #define vp9_fwht4x4 vp9_fwht4x4_mmx | |
| 82 | |
/*
 * vp9_iht16x16_256_add is bound at compile time to the _sse2 variant via
 * the macro.
 */
| 83 void vp9_iht16x16_256_add_c(const tran_low_t *input, uint8_t *output, int pitch,
int tx_type); | |
| 84 void vp9_iht16x16_256_add_sse2(const tran_low_t *input, uint8_t *output, int pit
ch, int tx_type); | |
| 85 #define vp9_iht16x16_256_add vp9_iht16x16_256_add_sse2 | |
| 86 | |
/*
 * vp9_iht4x4_16_add is bound at compile time to the _sse2 variant via the
 * macro.
 */
| 87 void vp9_iht4x4_16_add_c(const tran_low_t *input, uint8_t *dest, int dest_stride
, int tx_type); | |
| 88 void vp9_iht4x4_16_add_sse2(const tran_low_t *input, uint8_t *dest, int dest_str
ide, int tx_type); | |
| 89 #define vp9_iht4x4_16_add vp9_iht4x4_16_add_sse2 | |
| 90 | |
/*
 * vp9_iht8x8_64_add is bound at compile time to the _sse2 variant via the
 * macro.
 */
| 91 void vp9_iht8x8_64_add_c(const tran_low_t *input, uint8_t *dest, int dest_stride
, int tx_type); | |
| 92 void vp9_iht8x8_64_add_sse2(const tran_low_t *input, uint8_t *dest, int dest_str
ide, int tx_type); | |
| 93 #define vp9_iht8x8_64_add vp9_iht8x8_64_add_sse2 | |
| 94 | |
/*
 * vp9_mbpost_proc_across_ip is bound at compile time to the _xmm variant
 * via the macro.
 */
| 95 void vp9_mbpost_proc_across_ip_c(uint8_t *src, int pitch, int rows, int cols, in
t flimit); | |
| 96 void vp9_mbpost_proc_across_ip_xmm(uint8_t *src, int pitch, int rows, int cols,
int flimit); | |
| 97 #define vp9_mbpost_proc_across_ip vp9_mbpost_proc_across_ip_xmm | |
| 98 | |
/*
 * vp9_mbpost_proc_down is bound at compile time to the _xmm variant via the
 * macro.
 */
| 99 void vp9_mbpost_proc_down_c(uint8_t *dst, int pitch, int rows, int cols, int fli
mit); | |
| 100 void vp9_mbpost_proc_down_xmm(uint8_t *dst, int pitch, int rows, int cols, int f
limit); | |
| 101 #define vp9_mbpost_proc_down vp9_mbpost_proc_down_xmm | |
| 102 | |
/*
 * vp9_plane_add_noise is bound at compile time to the _wmt variant via the
 * macro. The three clamp parameters are written as char[16]; as function
 * parameters they are passed as plain char pointers.
 */
| 103 void vp9_plane_add_noise_c(uint8_t *Start, char *noise, char blackclamp[16], cha
r whiteclamp[16], char bothclamp[16], unsigned int Width, unsigned int Height, i
nt Pitch); | |
| 104 void vp9_plane_add_noise_wmt(uint8_t *Start, char *noise, char blackclamp[16], c
har whiteclamp[16], char bothclamp[16], unsigned int Width, unsigned int Height,
int Pitch); | |
| 105 #define vp9_plane_add_noise vp9_plane_add_noise_wmt | |
| 106 | |
/*
 * vp9_post_proc_down_and_across is bound at compile time to the _xmm
 * variant via the macro.
 */
| 107 void vp9_post_proc_down_and_across_c(const uint8_t *src_ptr, uint8_t *dst_ptr, i
nt src_pixels_per_line, int dst_pixels_per_line, int rows, int cols, int flimit)
; | |
| 108 void vp9_post_proc_down_and_across_xmm(const uint8_t *src_ptr, uint8_t *dst_ptr,
int src_pixels_per_line, int dst_pixels_per_line, int rows, int cols, int flimi
t); | |
| 109 #define vp9_post_proc_down_and_across vp9_post_proc_down_and_across_xmm | |
| 110 | |
/*
 * vp9_quantize_fp: reached through a function pointer.
 * setup_rtcd_internal() starts from the _sse2 variant and switches to _ssse3
 * when HAS_SSSE3 is reported. The _c variant is declared but never selected
 * in this header.
 */
| 111 void vp9_quantize_fp_c(const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_
block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_p
tr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_
ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const i
nt16_t *iscan); | |
| 112 void vp9_quantize_fp_sse2(const tran_low_t *coeff_ptr, intptr_t n_coeffs, int sk
ip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quan
t_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoe
ff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, cons
t int16_t *iscan); | |
| 113 void vp9_quantize_fp_ssse3(const tran_low_t *coeff_ptr, intptr_t n_coeffs, int s
kip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *qua
nt_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqco
eff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, con
st int16_t *iscan); | |
| 114 RTCD_EXTERN void (*vp9_quantize_fp)(const tran_low_t *coeff_ptr, intptr_t n_coef
fs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int
16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_lo
w_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *
scan, const int16_t *iscan); | |
| 115 | |
/*
 * vp9_quantize_fp_32x32: reached through a function pointer.
 * setup_rtcd_internal() starts from the _c variant and switches to _ssse3
 * when HAS_SSSE3 is reported.
 */
| 116 void vp9_quantize_fp_32x32_c(const tran_low_t *coeff_ptr, intptr_t n_coeffs, int
skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *q
uant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dq
coeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, c
onst int16_t *iscan); | |
| 117 void vp9_quantize_fp_32x32_ssse3(const tran_low_t *coeff_ptr, intptr_t n_coeffs,
int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_
t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t
*dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *sca
n, const int16_t *iscan); | |
| 118 RTCD_EXTERN void (*vp9_quantize_fp_32x32)(const tran_low_t *coeff_ptr, intptr_t
n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, con
st int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, t
ran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int
16_t *scan, const int16_t *iscan); | |
| 119 | |
/*
 * vp9_scale_and_extend_frame: reached through a function pointer.
 * setup_rtcd_internal() starts from the _c variant and switches to _ssse3
 * when HAS_SSSE3 is reported.
 */
| 120 void vp9_scale_and_extend_frame_c(const struct yv12_buffer_config *src, struct y
v12_buffer_config *dst); | |
| 121 void vp9_scale_and_extend_frame_ssse3(const struct yv12_buffer_config *src, stru
ct yv12_buffer_config *dst); | |
| 122 RTCD_EXTERN void (*vp9_scale_and_extend_frame)(const struct yv12_buffer_config *
src, struct yv12_buffer_config *dst); | |
| 123 | |
/*
 * vp9_temporal_filter_apply is bound at compile time to the _sse2 variant
 * via the macro.
 */
| 124 void vp9_temporal_filter_apply_c(uint8_t *frame1, unsigned int stride, uint8_t *
frame2, unsigned int block_width, unsigned int block_height, int strength, int f
ilter_weight, unsigned int *accumulator, uint16_t *count); | |
| 125 void vp9_temporal_filter_apply_sse2(uint8_t *frame1, unsigned int stride, uint8_
t *frame2, unsigned int block_width, unsigned int block_height, int strength, in
t filter_weight, unsigned int *accumulator, uint16_t *count); | |
| 126 #define vp9_temporal_filter_apply vp9_temporal_filter_apply_sse2 | |
| 127 | |
/*
 * Declared here, defined elsewhere.
 * NOTE(review): presumably the public entry point that ends up running
 * setup_rtcd_internal() - confirm against the translation unit that
 * defines RTCD_C.
 */
| 128 void vp9_rtcd(void); | |
| 129 | |
| 130 #ifdef RTCD_C | |
| 131 #include "vpx_ports/x86.h" | |
/*
 * Binds every function pointer declared with RTCD_EXTERN in this header.
 *
 * Each pointer is first set to a baseline implementation and then
 * overwritten once per matching CPU feature bit returned by
 * x86_simd_caps(). A later assignment replaces an earlier one, so the order
 * of the `if` lines decides which variant wins when several bits are set.
 *
 * Baselines differ: vp9_block_error, vp9_fdct8x8_quant and vp9_quantize_fp
 * start from their _sse2 variants; the other pointers start from _c.
 *
 * Only compiled where RTCD_C is defined (see the enclosing #ifdef).
 */
| 132 static void setup_rtcd_internal(void) | |
| 133 { | |
| 134 int flags = x86_simd_caps(); | |
| 135 | |
/* No-op cast; presumably keeps `flags` counted as used in configurations
 * that emit no feature checks - TODO confirm. */
| 136 (void)flags; | |
| 137 | |
| 138 vp9_block_error = vp9_block_error_sse2; | |
| 139 if (flags & HAS_AVX2) vp9_block_error = vp9_block_error_avx2; | |
| 140 vp9_diamond_search_sad = vp9_diamond_search_sad_c; | |
| 141 if (flags & HAS_AVX) vp9_diamond_search_sad = vp9_diamond_search_sad_avx; | |
| 142 vp9_fdct8x8_quant = vp9_fdct8x8_quant_sse2; | |
| 143 if (flags & HAS_SSSE3) vp9_fdct8x8_quant = vp9_fdct8x8_quant_ssse3; | |
/* Two overrides: the SSE4.1 check runs after the SSE3 check, so sadx8
 * takes precedence over sadx3 when both bits are present. */
| 144 vp9_full_search_sad = vp9_full_search_sad_c; | |
| 145 if (flags & HAS_SSE3) vp9_full_search_sad = vp9_full_search_sadx3; | |
| 146 if (flags & HAS_SSE4_1) vp9_full_search_sad = vp9_full_search_sadx8; | |
| 147 vp9_quantize_fp = vp9_quantize_fp_sse2; | |
| 148 if (flags & HAS_SSSE3) vp9_quantize_fp = vp9_quantize_fp_ssse3; | |
| 149 vp9_quantize_fp_32x32 = vp9_quantize_fp_32x32_c; | |
| 150 if (flags & HAS_SSSE3) vp9_quantize_fp_32x32 = vp9_quantize_fp_32x32_ssse3; | |
| 151 vp9_scale_and_extend_frame = vp9_scale_and_extend_frame_c; | |
| 152 if (flags & HAS_SSSE3) vp9_scale_and_extend_frame = vp9_scale_and_extend_fra
me_ssse3; | |
| 153 } | |
| 154 #endif | |
| 155 | |
| 156 #ifdef __cplusplus | |
| 157 } // extern "C" | |
| 158 #endif | |
| 159 | |
| 160 #endif | |
| OLD | NEW |