| OLD | NEW |
| 1 sub vpx_dsp_forward_decls() { | 1 sub vpx_dsp_forward_decls() { |
| 2 print <<EOF | 2 print <<EOF |
| 3 /* | 3 /* |
| 4 * DSP | 4 * DSP |
| 5 */ | 5 */ |
| 6 | 6 |
| 7 #include "vpx/vpx_integer.h" | 7 #include "vpx/vpx_integer.h" |
| 8 #include "vpx_dsp/vpx_dsp_common.h" | 8 #include "vpx_dsp/vpx_dsp_common.h" |
| 9 | 9 |
| 10 EOF | 10 EOF |
| (...skipping 36 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 47 $sse2_x86_64 = 'sse2'; | 47 $sse2_x86_64 = 'sse2'; |
| 48 $ssse3_x86_64 = 'ssse3'; | 48 $ssse3_x86_64 = 'ssse3'; |
| 49 $avx_x86_64 = 'avx'; | 49 $avx_x86_64 = 'avx'; |
| 50 $avx2_x86_64 = 'avx2'; | 50 $avx2_x86_64 = 'avx2'; |
| 51 } | 51 } |
| 52 | 52 |
| 53 # | 53 # |
| 54 # Intra prediction | 54 # Intra prediction |
| 55 # | 55 # |
| 56 | 56 |
| 57 if (vpx_config("CONFIG_VP9") eq "yes") { | 57 if ((vpx_config("CONFIG_VP9") eq "yes") || (vpx_config("CONFIG_VP10") eq "yes"))
{ |
| 58 add_proto qw/void vpx_d207_predictor_4x4/, "uint8_t *dst, ptrdiff_t y_stride,
const uint8_t *above, const uint8_t *left"; | 58 add_proto qw/void vpx_d207_predictor_4x4/, "uint8_t *dst, ptrdiff_t y_stride,
const uint8_t *above, const uint8_t *left"; |
| 59 specialize qw/vpx_d207_predictor_4x4/, "$ssse3_x86inc"; | 59 specialize qw/vpx_d207_predictor_4x4/, "$ssse3_x86inc"; |
| 60 | 60 |
| 61 add_proto qw/void vpx_d45_predictor_4x4/, "uint8_t *dst, ptrdiff_t y_stride, c
onst uint8_t *above, const uint8_t *left"; | 61 add_proto qw/void vpx_d45_predictor_4x4/, "uint8_t *dst, ptrdiff_t y_stride, c
onst uint8_t *above, const uint8_t *left"; |
| 62 specialize qw/vpx_d45_predictor_4x4 neon/, "$ssse3_x86inc"; | 62 specialize qw/vpx_d45_predictor_4x4 neon/, "$ssse3_x86inc"; |
| 63 | 63 |
| 64 add_proto qw/void vpx_d63_predictor_4x4/, "uint8_t *dst, ptrdiff_t y_stride, c
onst uint8_t *above, const uint8_t *left"; | 64 add_proto qw/void vpx_d63_predictor_4x4/, "uint8_t *dst, ptrdiff_t y_stride, c
onst uint8_t *above, const uint8_t *left"; |
| 65 specialize qw/vpx_d63_predictor_4x4/, "$ssse3_x86inc"; | 65 specialize qw/vpx_d63_predictor_4x4/, "$ssse3_x86inc"; |
| 66 | 66 |
| 67 add_proto qw/void vpx_h_predictor_4x4/, "uint8_t *dst, ptrdiff_t y_stride, con
st uint8_t *above, const uint8_t *left"; | 67 add_proto qw/void vpx_h_predictor_4x4/, "uint8_t *dst, ptrdiff_t y_stride, con
st uint8_t *above, const uint8_t *left"; |
| (...skipping 294 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 362 | 362 |
| 363 add_proto qw/void vpx_highbd_dc_top_predictor_32x32/, "uint16_t *dst, ptrdif
f_t y_stride, const uint16_t *above, const uint16_t *left, int bd"; | 363 add_proto qw/void vpx_highbd_dc_top_predictor_32x32/, "uint16_t *dst, ptrdif
f_t y_stride, const uint16_t *above, const uint16_t *left, int bd"; |
| 364 specialize qw/vpx_highbd_dc_top_predictor_32x32/; | 364 specialize qw/vpx_highbd_dc_top_predictor_32x32/; |
| 365 | 365 |
| 366 add_proto qw/void vpx_highbd_dc_left_predictor_32x32/, "uint16_t *dst, ptrdi
ff_t y_stride, const uint16_t *above, const uint16_t *left, int bd"; | 366 add_proto qw/void vpx_highbd_dc_left_predictor_32x32/, "uint16_t *dst, ptrdi
ff_t y_stride, const uint16_t *above, const uint16_t *left, int bd"; |
| 367 specialize qw/vpx_highbd_dc_left_predictor_32x32/; | 367 specialize qw/vpx_highbd_dc_left_predictor_32x32/; |
| 368 | 368 |
| 369 add_proto qw/void vpx_highbd_dc_128_predictor_32x32/, "uint16_t *dst, ptrdif
f_t y_stride, const uint16_t *above, const uint16_t *left, int bd"; | 369 add_proto qw/void vpx_highbd_dc_128_predictor_32x32/, "uint16_t *dst, ptrdif
f_t y_stride, const uint16_t *above, const uint16_t *left, int bd"; |
| 370 specialize qw/vpx_highbd_dc_128_predictor_32x32/; | 370 specialize qw/vpx_highbd_dc_128_predictor_32x32/; |
| 371 } # CONFIG_VP9_HIGHBITDEPTH | 371 } # CONFIG_VP9_HIGHBITDEPTH |
| 372 } # CONFIG_VP9 | 372 } # CONFIG_VP9 || CONFIG_VP10 |
| 373 | 373 |
| 374 # | 374 # |
| 375 # Sub Pixel Filters | 375 # Sub Pixel Filters |
| 376 # | 376 # |
| 377 add_proto qw/void vpx_convolve_copy/, "const uint8_t *src, ptrdiff_t src_stride,
uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, con
st int16_t *filter_y, int y_step_q4, int w, int h"; | 377 add_proto qw/void vpx_convolve_copy/, "const uint8_t *src, ptrdiff_t src_stride,
uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, con
st int16_t *filter_y, int y_step_q4, int w, int h"; |
| 378 specialize qw/vpx_convolve_copy neon dspr2 msa/, "$sse2_x86inc"; | 378 specialize qw/vpx_convolve_copy neon dspr2 msa/, "$sse2_x86inc"; |
| 379 | 379 |
| 380 add_proto qw/void vpx_convolve_avg/, "const uint8_t *src, ptrdiff_t src_stride,
uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, cons
t int16_t *filter_y, int y_step_q4, int w, int h"; | 380 add_proto qw/void vpx_convolve_avg/, "const uint8_t *src, ptrdiff_t src_stride,
uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, cons
t int16_t *filter_y, int y_step_q4, int w, int h"; |
| 381 specialize qw/vpx_convolve_avg neon dspr2 msa/, "$sse2_x86inc"; | 381 specialize qw/vpx_convolve_avg neon dspr2 msa/, "$sse2_x86inc"; |
| 382 | 382 |
| 383 add_proto qw/void vpx_convolve8/, "const uint8_t *src, ptrdiff_t src_stride, uin
t8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const i
nt16_t *filter_y, int y_step_q4, int w, int h"; | 383 add_proto qw/void vpx_convolve8/, "const uint8_t *src, ptrdiff_t src_stride, uin
t8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const i
nt16_t *filter_y, int y_step_q4, int w, int h"; |
| 384 specialize qw/vpx_convolve8 sse2 ssse3 neon dspr2 msa/, "$avx2_ssse3"; | 384 specialize qw/vpx_convolve8 sse2 ssse3 neon dspr2 msa/, "$avx2_ssse3"; |
| 385 | 385 |
| 386 add_proto qw/void vpx_convolve8_horiz/, "const uint8_t *src, ptrdiff_t src_strid
e, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, c
onst int16_t *filter_y, int y_step_q4, int w, int h"; | 386 add_proto qw/void vpx_convolve8_horiz/, "const uint8_t *src, ptrdiff_t src_strid
e, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, c
onst int16_t *filter_y, int y_step_q4, int w, int h"; |
| 387 specialize qw/vpx_convolve8_horiz sse2 ssse3 neon dspr2 msa/, "$avx2_ssse3"; | 387 specialize qw/vpx_convolve8_horiz sse2 ssse3 neon dspr2 msa/, "$avx2_ssse3"; |
| 388 | 388 |
| 389 add_proto qw/void vpx_convolve8_vert/, "const uint8_t *src, ptrdiff_t src_stride
, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, co
nst int16_t *filter_y, int y_step_q4, int w, int h"; | 389 add_proto qw/void vpx_convolve8_vert/, "const uint8_t *src, ptrdiff_t src_stride
, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, co
nst int16_t *filter_y, int y_step_q4, int w, int h"; |
| 390 specialize qw/vpx_convolve8_vert sse2 ssse3 neon dspr2 msa/, "$avx2_ssse3"; | 390 specialize qw/vpx_convolve8_vert sse2 ssse3 neon dspr2 msa/, "$avx2_ssse3"; |
| 391 | 391 |
| 392 add_proto qw/void vpx_convolve8_avg/, "const uint8_t *src, ptrdiff_t src_stride,
uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, con
st int16_t *filter_y, int y_step_q4, int w, int h"; | 392 add_proto qw/void vpx_convolve8_avg/, "const uint8_t *src, ptrdiff_t src_stride,
uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, con
st int16_t *filter_y, int y_step_q4, int w, int h"; |
| 393 specialize qw/vpx_convolve8_avg sse2 ssse3 neon dspr2 msa/; | 393 specialize qw/vpx_convolve8_avg sse2 ssse3 neon dspr2 msa/; |
| 394 | 394 |
| 395 add_proto qw/void vpx_convolve8_avg_horiz/, "const uint8_t *src, ptrdiff_t src_s
tride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q
4, const int16_t *filter_y, int y_step_q4, int w, int h"; | 395 add_proto qw/void vpx_convolve8_avg_horiz/, "const uint8_t *src, ptrdiff_t src_s
tride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q
4, const int16_t *filter_y, int y_step_q4, int w, int h"; |
| 396 specialize qw/vpx_convolve8_avg_horiz sse2 ssse3 neon dspr2 msa/; | 396 specialize qw/vpx_convolve8_avg_horiz sse2 ssse3 neon dspr2 msa/; |
| 397 | 397 |
| 398 add_proto qw/void vpx_convolve8_avg_vert/, "const uint8_t *src, ptrdiff_t src_st
ride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4
, const int16_t *filter_y, int y_step_q4, int w, int h"; | 398 add_proto qw/void vpx_convolve8_avg_vert/, "const uint8_t *src, ptrdiff_t src_st
ride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4
, const int16_t *filter_y, int y_step_q4, int w, int h"; |
| 399 specialize qw/vpx_convolve8_avg_vert sse2 ssse3 neon dspr2 msa/; | 399 specialize qw/vpx_convolve8_avg_vert sse2 ssse3 neon dspr2 msa/; |
| 400 | 400 |
| 401 add_proto qw/void vpx_scaled_2d/, "const uint8_t *src, ptrdiff_t src_stride, uin
t8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const i
nt16_t *filter_y, int y_step_q4, int w, int h"; |
| 402 specialize qw/vpx_scaled_2d ssse3/; |
| 403 |
| 404 add_proto qw/void vpx_scaled_horiz/, "const uint8_t *src, ptrdiff_t src_stride,
uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, cons
t int16_t *filter_y, int y_step_q4, int w, int h"; |
| 405 specialize qw/vpx_scaled_horiz/; |
| 406 |
| 407 add_proto qw/void vpx_scaled_vert/, "const uint8_t *src, ptrdiff_t src_stride, u
int8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const
int16_t *filter_y, int y_step_q4, int w, int h"; |
| 408 specialize qw/vpx_scaled_vert/; |
| 409 |
| 410 add_proto qw/void vpx_scaled_avg_2d/, "const uint8_t *src, ptrdiff_t src_stride,
uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, con
st int16_t *filter_y, int y_step_q4, int w, int h"; |
| 411 specialize qw/vpx_scaled_avg_2d/; |
| 412 |
| 413 add_proto qw/void vpx_scaled_avg_horiz/, "const uint8_t *src, ptrdiff_t src_stri
de, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4,
const int16_t *filter_y, int y_step_q4, int w, int h"; |
| 414 specialize qw/vpx_scaled_avg_horiz/; |
| 415 |
| 416 add_proto qw/void vpx_scaled_avg_vert/, "const uint8_t *src, ptrdiff_t src_strid
e, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, c
onst int16_t *filter_y, int y_step_q4, int w, int h"; |
| 417 specialize qw/vpx_scaled_avg_vert/; |
| 418 |
| 401 if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") { | 419 if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") { |
| 402 # | 420 # |
| 403 # Sub Pixel Filters | 421 # Sub Pixel Filters |
| 404 # | 422 # |
| 405 add_proto qw/void vpx_highbd_convolve_copy/, "const uint8_t *src, ptrdiff_t sr
c_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_ste
p_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps"; | 423 add_proto qw/void vpx_highbd_convolve_copy/, "const uint8_t *src, ptrdiff_t sr
c_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_ste
p_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps"; |
| 406 specialize qw/vpx_highbd_convolve_copy/; | 424 specialize qw/vpx_highbd_convolve_copy/; |
| 407 | 425 |
| 408 add_proto qw/void vpx_highbd_convolve_avg/, "const uint8_t *src, ptrdiff_t src
_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step
_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps"; | 426 add_proto qw/void vpx_highbd_convolve_avg/, "const uint8_t *src, ptrdiff_t src
_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step
_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps"; |
| 409 specialize qw/vpx_highbd_convolve_avg/; | 427 specialize qw/vpx_highbd_convolve_avg/; |
| 410 | 428 |
| (...skipping 13 matching lines...) Expand all Loading... |
| 424 specialize qw/vpx_highbd_convolve8_avg_horiz/, "$sse2_x86_64"; | 442 specialize qw/vpx_highbd_convolve8_avg_horiz/, "$sse2_x86_64"; |
| 425 | 443 |
| 426 add_proto qw/void vpx_highbd_convolve8_avg_vert/, "const uint8_t *src, ptrdiff
_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int
x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps"; | 444 add_proto qw/void vpx_highbd_convolve8_avg_vert/, "const uint8_t *src, ptrdiff
_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int
x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps"; |
| 427 specialize qw/vpx_highbd_convolve8_avg_vert/, "$sse2_x86_64"; | 445 specialize qw/vpx_highbd_convolve8_avg_vert/, "$sse2_x86_64"; |
| 428 } # CONFIG_VP9_HIGHBITDEPTH | 446 } # CONFIG_VP9_HIGHBITDEPTH |
| 429 | 447 |
| 430 # | 448 # |
| 431 # Loopfilter | 449 # Loopfilter |
| 432 # | 450 # |
| 433 add_proto qw/void vpx_lpf_vertical_16/, "uint8_t *s, int pitch, const uint8_t *b
limit, const uint8_t *limit, const uint8_t *thresh"; | 451 add_proto qw/void vpx_lpf_vertical_16/, "uint8_t *s, int pitch, const uint8_t *b
limit, const uint8_t *limit, const uint8_t *thresh"; |
| 434 specialize qw/vpx_lpf_vertical_16 sse2 neon_asm msa/; | 452 specialize qw/vpx_lpf_vertical_16 sse2 neon_asm dspr2 msa/; |
| 435 $vpx_lpf_vertical_16_neon_asm=vpx_lpf_vertical_16_neon; | 453 $vpx_lpf_vertical_16_neon_asm=vpx_lpf_vertical_16_neon; |
| 436 | 454 |
| 437 add_proto qw/void vpx_lpf_vertical_16_dual/, "uint8_t *s, int pitch, const uint8
_t *blimit, const uint8_t *limit, const uint8_t *thresh"; | 455 add_proto qw/void vpx_lpf_vertical_16_dual/, "uint8_t *s, int pitch, const uint8
_t *blimit, const uint8_t *limit, const uint8_t *thresh"; |
| 438 specialize qw/vpx_lpf_vertical_16_dual sse2 neon_asm msa/; | 456 specialize qw/vpx_lpf_vertical_16_dual sse2 neon_asm dspr2 msa/; |
| 439 $vpx_lpf_vertical_16_dual_neon_asm=vpx_lpf_vertical_16_dual_neon; | 457 $vpx_lpf_vertical_16_dual_neon_asm=vpx_lpf_vertical_16_dual_neon; |
| 440 | 458 |
| 441 add_proto qw/void vpx_lpf_vertical_8/, "uint8_t *s, int pitch, const uint8_t *bl
imit, const uint8_t *limit, const uint8_t *thresh, int count"; | 459 add_proto qw/void vpx_lpf_vertical_8/, "uint8_t *s, int pitch, const uint8_t *bl
imit, const uint8_t *limit, const uint8_t *thresh, int count"; |
| 442 specialize qw/vpx_lpf_vertical_8 sse2 neon msa/; | 460 specialize qw/vpx_lpf_vertical_8 sse2 neon dspr2 msa/; |
| 443 | 461 |
| 444 add_proto qw/void vpx_lpf_vertical_8_dual/, "uint8_t *s, int pitch, const uint8_
t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit
1, const uint8_t *limit1, const uint8_t *thresh1"; | 462 add_proto qw/void vpx_lpf_vertical_8_dual/, "uint8_t *s, int pitch, const uint8_
t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit
1, const uint8_t *limit1, const uint8_t *thresh1"; |
| 445 specialize qw/vpx_lpf_vertical_8_dual sse2 neon_asm msa/; | 463 specialize qw/vpx_lpf_vertical_8_dual sse2 neon_asm dspr2 msa/; |
| 446 $vpx_lpf_vertical_8_dual_neon_asm=vpx_lpf_vertical_8_dual_neon; | 464 $vpx_lpf_vertical_8_dual_neon_asm=vpx_lpf_vertical_8_dual_neon; |
| 447 | 465 |
| 448 add_proto qw/void vpx_lpf_vertical_4/, "uint8_t *s, int pitch, const uint8_t *bl
imit, const uint8_t *limit, const uint8_t *thresh, int count"; | 466 add_proto qw/void vpx_lpf_vertical_4/, "uint8_t *s, int pitch, const uint8_t *bl
imit, const uint8_t *limit, const uint8_t *thresh, int count"; |
| 449 specialize qw/vpx_lpf_vertical_4 mmx neon msa/; | 467 specialize qw/vpx_lpf_vertical_4 mmx neon dspr2 msa/; |
| 450 | 468 |
| 451 add_proto qw/void vpx_lpf_vertical_4_dual/, "uint8_t *s, int pitch, const uint8_
t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit
1, const uint8_t *limit1, const uint8_t *thresh1"; | 469 add_proto qw/void vpx_lpf_vertical_4_dual/, "uint8_t *s, int pitch, const uint8_
t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit
1, const uint8_t *limit1, const uint8_t *thresh1"; |
| 452 specialize qw/vpx_lpf_vertical_4_dual sse2 neon msa/; | 470 specialize qw/vpx_lpf_vertical_4_dual sse2 neon dspr2 msa/; |
| 453 | 471 |
| 454 add_proto qw/void vpx_lpf_horizontal_16/, "uint8_t *s, int pitch, const uint8_t
*blimit, const uint8_t *limit, const uint8_t *thresh, int count"; | 472 add_proto qw/void vpx_lpf_horizontal_16/, "uint8_t *s, int pitch, const uint8_t
*blimit, const uint8_t *limit, const uint8_t *thresh, int count"; |
| 455 specialize qw/vpx_lpf_horizontal_16 sse2 avx2 neon_asm msa/; | 473 specialize qw/vpx_lpf_horizontal_16 sse2 avx2 neon_asm dspr2 msa/; |
| 456 $vpx_lpf_horizontal_16_neon_asm=vpx_lpf_horizontal_16_neon; | 474 $vpx_lpf_horizontal_16_neon_asm=vpx_lpf_horizontal_16_neon; |
| 457 | 475 |
| 458 add_proto qw/void vpx_lpf_horizontal_8/, "uint8_t *s, int pitch, const uint8_t *
blimit, const uint8_t *limit, const uint8_t *thresh, int count"; | 476 add_proto qw/void vpx_lpf_horizontal_8/, "uint8_t *s, int pitch, const uint8_t *
blimit, const uint8_t *limit, const uint8_t *thresh, int count"; |
| 459 specialize qw/vpx_lpf_horizontal_8 sse2 neon msa/; | 477 specialize qw/vpx_lpf_horizontal_8 sse2 neon dspr2 msa/; |
| 460 | 478 |
| 461 add_proto qw/void vpx_lpf_horizontal_8_dual/, "uint8_t *s, int pitch, const uint
8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blim
it1, const uint8_t *limit1, const uint8_t *thresh1"; | 479 add_proto qw/void vpx_lpf_horizontal_8_dual/, "uint8_t *s, int pitch, const uint
8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blim
it1, const uint8_t *limit1, const uint8_t *thresh1"; |
| 462 specialize qw/vpx_lpf_horizontal_8_dual sse2 neon_asm msa/; | 480 specialize qw/vpx_lpf_horizontal_8_dual sse2 neon_asm dspr2 msa/; |
| 463 $vpx_lpf_horizontal_8_dual_neon_asm=vpx_lpf_horizontal_8_dual_neon; | 481 $vpx_lpf_horizontal_8_dual_neon_asm=vpx_lpf_horizontal_8_dual_neon; |
| 464 | 482 |
| 465 add_proto qw/void vpx_lpf_horizontal_4/, "uint8_t *s, int pitch, const uint8_t *
blimit, const uint8_t *limit, const uint8_t *thresh, int count"; | 483 add_proto qw/void vpx_lpf_horizontal_4/, "uint8_t *s, int pitch, const uint8_t *
blimit, const uint8_t *limit, const uint8_t *thresh, int count"; |
| 466 specialize qw/vpx_lpf_horizontal_4 mmx neon msa/; | 484 specialize qw/vpx_lpf_horizontal_4 mmx neon dspr2 msa/; |
| 467 | 485 |
| 468 add_proto qw/void vpx_lpf_horizontal_4_dual/, "uint8_t *s, int pitch, const uint
8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blim
it1, const uint8_t *limit1, const uint8_t *thresh1"; | 486 add_proto qw/void vpx_lpf_horizontal_4_dual/, "uint8_t *s, int pitch, const uint
8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blim
it1, const uint8_t *limit1, const uint8_t *thresh1"; |
| 469 specialize qw/vpx_lpf_horizontal_4_dual sse2 neon msa/; | 487 specialize qw/vpx_lpf_horizontal_4_dual sse2 neon dspr2 msa/; |
| 470 | 488 |
| 471 if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") { | 489 if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") { |
| 472 add_proto qw/void vpx_highbd_lpf_vertical_16/, "uint16_t *s, int pitch, const
uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int bd"; | 490 add_proto qw/void vpx_highbd_lpf_vertical_16/, "uint16_t *s, int pitch, const
uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int bd"; |
| 473 specialize qw/vpx_highbd_lpf_vertical_16 sse2/; | 491 specialize qw/vpx_highbd_lpf_vertical_16 sse2/; |
| 474 | 492 |
| 475 add_proto qw/void vpx_highbd_lpf_vertical_16_dual/, "uint16_t *s, int pitch, c
onst uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int bd"; | 493 add_proto qw/void vpx_highbd_lpf_vertical_16_dual/, "uint16_t *s, int pitch, c
onst uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int bd"; |
| 476 specialize qw/vpx_highbd_lpf_vertical_16_dual sse2/; | 494 specialize qw/vpx_highbd_lpf_vertical_16_dual sse2/; |
| 477 | 495 |
| 478 add_proto qw/void vpx_highbd_lpf_vertical_8/, "uint16_t *s, int pitch, const u
int8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count, int bd"; | 496 add_proto qw/void vpx_highbd_lpf_vertical_8/, "uint16_t *s, int pitch, const u
int8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count, int bd"; |
| 479 specialize qw/vpx_highbd_lpf_vertical_8 sse2/; | 497 specialize qw/vpx_highbd_lpf_vertical_8 sse2/; |
| (...skipping 23 matching lines...) Expand all Loading... |
| 503 specialize qw/vpx_highbd_lpf_horizontal_4_dual sse2/; | 521 specialize qw/vpx_highbd_lpf_horizontal_4_dual sse2/; |
| 504 } # CONFIG_VP9_HIGHBITDEPTH | 522 } # CONFIG_VP9_HIGHBITDEPTH |
| 505 | 523 |
| 506 # | 524 # |
| 507 # Encoder functions. | 525 # Encoder functions. |
| 508 # | 526 # |
| 509 | 527 |
| 510 # | 528 # |
| 511 # Forward transform | 529 # Forward transform |
| 512 # | 530 # |
| 513 if (vpx_config("CONFIG_VP9_ENCODER") eq "yes") { | 531 if ((vpx_config("CONFIG_VP9_ENCODER") eq "yes") || (vpx_config("CONFIG_VP10_ENCO
DER") eq "yes")) { |
| 514 if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") { | 532 if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") { |
| 515 add_proto qw/void vpx_fdct4x4/, "const int16_t *input, tran_low_t *output, int
stride"; | 533 add_proto qw/void vpx_fdct4x4/, "const int16_t *input, tran_low_t *output, int
stride"; |
| 516 specialize qw/vpx_fdct4x4 sse2/; | 534 specialize qw/vpx_fdct4x4 sse2/; |
| 517 | 535 |
| 518 add_proto qw/void vpx_fdct4x4_1/, "const int16_t *input, tran_low_t *output, i
nt stride"; | 536 add_proto qw/void vpx_fdct4x4_1/, "const int16_t *input, tran_low_t *output, i
nt stride"; |
| 519 specialize qw/vpx_fdct4x4_1 sse2/; | 537 specialize qw/vpx_fdct4x4_1 sse2/; |
| 520 | 538 |
| 521 add_proto qw/void vpx_fdct8x8/, "const int16_t *input, tran_low_t *output, int
stride"; | 539 add_proto qw/void vpx_fdct8x8/, "const int16_t *input, tran_low_t *output, int
stride"; |
| 522 specialize qw/vpx_fdct8x8 sse2/; | 540 specialize qw/vpx_fdct8x8 sse2/; |
| 523 | 541 |
| (...skipping 59 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 583 | 601 |
| 584 add_proto qw/void vpx_fdct32x32/, "const int16_t *input, tran_low_t *output, i
nt stride"; | 602 add_proto qw/void vpx_fdct32x32/, "const int16_t *input, tran_low_t *output, i
nt stride"; |
| 585 specialize qw/vpx_fdct32x32 sse2 avx2 msa/; | 603 specialize qw/vpx_fdct32x32 sse2 avx2 msa/; |
| 586 | 604 |
| 587 add_proto qw/void vpx_fdct32x32_rd/, "const int16_t *input, tran_low_t *output
, int stride"; | 605 add_proto qw/void vpx_fdct32x32_rd/, "const int16_t *input, tran_low_t *output
, int stride"; |
| 588 specialize qw/vpx_fdct32x32_rd sse2 avx2 msa/; | 606 specialize qw/vpx_fdct32x32_rd sse2 avx2 msa/; |
| 589 | 607 |
| 590 add_proto qw/void vpx_fdct32x32_1/, "const int16_t *input, tran_low_t *output,
int stride"; | 608 add_proto qw/void vpx_fdct32x32_1/, "const int16_t *input, tran_low_t *output,
int stride"; |
| 591 specialize qw/vpx_fdct32x32_1 sse2 msa/; | 609 specialize qw/vpx_fdct32x32_1 sse2 msa/; |
| 592 } # CONFIG_VP9_HIGHBITDEPTH | 610 } # CONFIG_VP9_HIGHBITDEPTH |
| 593 } # CONFIG_VP9_ENCODER | 611 } # CONFIG_VP9_ENCODER || CONFIG_VP10_ENCODER |
| 594 | 612 |
| 595 # | 613 # |
| 596 # Inverse transform | 614 # Inverse transform |
| 597 if (vpx_config("CONFIG_VP9") eq "yes") { | 615 if ((vpx_config("CONFIG_VP9") eq "yes") || (vpx_config("CONFIG_VP10") eq "yes"))
{ |
| 598 if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") { | 616 if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") { |
| 599 # Note as optimized versions of these functions are added we need to add a che
ck to ensure | 617 # Note as optimized versions of these functions are added we need to add a che
ck to ensure |
| 600 # that when CONFIG_EMULATE_HARDWARE is on, it defaults to the C versions only. | 618 # that when CONFIG_EMULATE_HARDWARE is on, it defaults to the C versions only. |
| 601 add_proto qw/void vp9_idct4x4_1_add/, "const tran_low_t *input, uint8_t *dest,
int dest_stride"; | 619 add_proto qw/void vpx_idct4x4_1_add/, "const tran_low_t *input, uint8_t *dest,
int dest_stride"; |
| 602 specialize qw/vp9_idct4x4_1_add/; | 620 specialize qw/vpx_idct4x4_1_add/; |
| 603 | 621 |
| 604 add_proto qw/void vp9_idct4x4_16_add/, "const tran_low_t *input, uint8_t *dest
, int dest_stride"; | 622 add_proto qw/void vpx_idct4x4_16_add/, "const tran_low_t *input, uint8_t *dest
, int dest_stride"; |
| 605 specialize qw/vp9_idct4x4_16_add/; | 623 specialize qw/vpx_idct4x4_16_add/; |
| 606 | 624 |
| 607 add_proto qw/void vp9_idct8x8_1_add/, "const tran_low_t *input, uint8_t *dest,
int dest_stride"; | 625 add_proto qw/void vpx_idct8x8_1_add/, "const tran_low_t *input, uint8_t *dest,
int dest_stride"; |
| 608 specialize qw/vp9_idct8x8_1_add/; | 626 specialize qw/vpx_idct8x8_1_add/; |
| 609 | 627 |
| 610 add_proto qw/void vp9_idct8x8_64_add/, "const tran_low_t *input, uint8_t *dest
, int dest_stride"; | 628 add_proto qw/void vpx_idct8x8_64_add/, "const tran_low_t *input, uint8_t *dest
, int dest_stride"; |
| 611 specialize qw/vp9_idct8x8_64_add/; | 629 specialize qw/vpx_idct8x8_64_add/; |
| 612 | 630 |
| 613 add_proto qw/void vp9_idct8x8_12_add/, "const tran_low_t *input, uint8_t *dest
, int dest_stride"; | 631 add_proto qw/void vpx_idct8x8_12_add/, "const tran_low_t *input, uint8_t *dest
, int dest_stride"; |
| 614 specialize qw/vp9_idct8x8_12_add/; | 632 specialize qw/vpx_idct8x8_12_add/; |
| 615 | 633 |
| 616 add_proto qw/void vp9_idct16x16_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; | 634 add_proto qw/void vpx_idct16x16_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; |
| 617 specialize qw/vp9_idct16x16_1_add/; | 635 specialize qw/vpx_idct16x16_1_add/; |
| 618 | 636 |
| 619 add_proto qw/void vp9_idct16x16_256_add/, "const tran_low_t *input, uint8_t *d
est, int dest_stride"; | 637 add_proto qw/void vpx_idct16x16_256_add/, "const tran_low_t *input, uint8_t *d
est, int dest_stride"; |
| 620 specialize qw/vp9_idct16x16_256_add/; | 638 specialize qw/vpx_idct16x16_256_add/; |
| 621 | 639 |
| 622 add_proto qw/void vp9_idct16x16_10_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; | 640 add_proto qw/void vpx_idct16x16_10_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; |
| 623 specialize qw/vp9_idct16x16_10_add/; | 641 specialize qw/vpx_idct16x16_10_add/; |
| 624 | 642 |
| 625 add_proto qw/void vp9_idct32x32_1024_add/, "const tran_low_t *input, uint8_t *
dest, int dest_stride"; | 643 add_proto qw/void vpx_idct32x32_1024_add/, "const tran_low_t *input, uint8_t *
dest, int dest_stride"; |
| 626 specialize qw/vp9_idct32x32_1024_add/; | 644 specialize qw/vpx_idct32x32_1024_add/; |
| 627 | 645 |
| 628 add_proto qw/void vp9_idct32x32_34_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; | 646 add_proto qw/void vpx_idct32x32_34_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; |
| 629 specialize qw/vp9_idct32x32_34_add/; | 647 specialize qw/vpx_idct32x32_34_add/; |
| 630 | 648 |
| 631 add_proto qw/void vp9_idct32x32_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; | 649 add_proto qw/void vpx_idct32x32_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; |
| 632 specialize qw/vp9_idct32x32_1_add/; | 650 specialize qw/vpx_idct32x32_1_add/; |
| 633 | 651 |
| 634 add_proto qw/void vp9_iwht4x4_1_add/, "const tran_low_t *input, uint8_t *dest,
int dest_stride"; | 652 add_proto qw/void vpx_iwht4x4_1_add/, "const tran_low_t *input, uint8_t *dest,
int dest_stride"; |
| 635 specialize qw/vp9_iwht4x4_1_add/; | 653 specialize qw/vpx_iwht4x4_1_add/; |
| 636 | 654 |
| 637 add_proto qw/void vp9_iwht4x4_16_add/, "const tran_low_t *input, uint8_t *dest
, int dest_stride"; | 655 add_proto qw/void vpx_iwht4x4_16_add/, "const tran_low_t *input, uint8_t *dest
, int dest_stride"; |
| 638 specialize qw/vp9_iwht4x4_16_add/; | 656 specialize qw/vpx_iwht4x4_16_add/; |
| 639 | 657 |
| 640 add_proto qw/void vp9_highbd_idct4x4_1_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride, int bd"; | 658 add_proto qw/void vpx_highbd_idct4x4_1_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride, int bd"; |
| 641 specialize qw/vp9_highbd_idct4x4_1_add/; | 659 specialize qw/vpx_highbd_idct4x4_1_add/; |
| 642 | 660 |
| 643 add_proto qw/void vp9_highbd_idct8x8_1_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride, int bd"; | 661 add_proto qw/void vpx_highbd_idct8x8_1_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride, int bd"; |
| 644 specialize qw/vp9_highbd_idct8x8_1_add/; | 662 specialize qw/vpx_highbd_idct8x8_1_add/; |
| 645 | 663 |
| 646 add_proto qw/void vp9_highbd_idct16x16_1_add/, "const tran_low_t *input, uint8
_t *dest, int dest_stride, int bd"; | 664 add_proto qw/void vpx_highbd_idct16x16_1_add/, "const tran_low_t *input, uint8
_t *dest, int dest_stride, int bd"; |
| 647 specialize qw/vp9_highbd_idct16x16_1_add/; | 665 specialize qw/vpx_highbd_idct16x16_1_add/; |
| 648 | 666 |
| 649 add_proto qw/void vp9_highbd_idct32x32_1024_add/, "const tran_low_t *input, ui
nt8_t *dest, int dest_stride, int bd"; | 667 add_proto qw/void vpx_highbd_idct32x32_1024_add/, "const tran_low_t *input, ui
nt8_t *dest, int dest_stride, int bd"; |
| 650 specialize qw/vp9_highbd_idct32x32_1024_add/; | 668 specialize qw/vpx_highbd_idct32x32_1024_add/; |
| 651 | 669 |
| 652 add_proto qw/void vp9_highbd_idct32x32_34_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; | 670 add_proto qw/void vpx_highbd_idct32x32_34_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; |
| 653 specialize qw/vp9_highbd_idct32x32_34_add/; | 671 specialize qw/vpx_highbd_idct32x32_34_add/; |
| 654 | 672 |
| 655 add_proto qw/void vp9_highbd_idct32x32_1_add/, "const tran_low_t *input, uint8
_t *dest, int dest_stride, int bd"; | 673 add_proto qw/void vpx_highbd_idct32x32_1_add/, "const tran_low_t *input, uint8
_t *dest, int dest_stride, int bd"; |
| 656 specialize qw/vp9_highbd_idct32x32_1_add/; | 674 specialize qw/vpx_highbd_idct32x32_1_add/; |
| 657 | 675 |
| 658 add_proto qw/void vp9_highbd_iwht4x4_1_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride, int bd"; | 676 add_proto qw/void vpx_highbd_iwht4x4_1_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride, int bd"; |
| 659 specialize qw/vp9_highbd_iwht4x4_1_add/; | 677 specialize qw/vpx_highbd_iwht4x4_1_add/; |
| 660 | 678 |
| 661 add_proto qw/void vp9_highbd_iwht4x4_16_add/, "const tran_low_t *input, uint8_
t *dest, int dest_stride, int bd"; | 679 add_proto qw/void vpx_highbd_iwht4x4_16_add/, "const tran_low_t *input, uint8_
t *dest, int dest_stride, int bd"; |
| 662 specialize qw/vp9_highbd_iwht4x4_16_add/; | 680 specialize qw/vpx_highbd_iwht4x4_16_add/; |
| 663 | 681 |
| 664 # Force C versions if CONFIG_EMULATE_HARDWARE is 1 | 682 # Force C versions if CONFIG_EMULATE_HARDWARE is 1 |
| 665 if (vpx_config("CONFIG_EMULATE_HARDWARE") eq "yes") { | 683 if (vpx_config("CONFIG_EMULATE_HARDWARE") eq "yes") { |
| 666 add_proto qw/void vp9_highbd_idct4x4_16_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; | 684 add_proto qw/void vpx_highbd_idct4x4_16_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; |
| 667 specialize qw/vp9_highbd_idct4x4_16_add/; | 685 specialize qw/vpx_highbd_idct4x4_16_add/; |
| 668 | 686 |
| 669 add_proto qw/void vp9_highbd_idct8x8_64_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; | 687 add_proto qw/void vpx_highbd_idct8x8_64_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; |
| 670 specialize qw/vp9_highbd_idct8x8_64_add/; | 688 specialize qw/vpx_highbd_idct8x8_64_add/; |
| 671 | 689 |
| 672 add_proto qw/void vp9_highbd_idct8x8_10_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; | 690 add_proto qw/void vpx_highbd_idct8x8_10_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; |
| 673 specialize qw/vp9_highbd_idct8x8_10_add/; | 691 specialize qw/vpx_highbd_idct8x8_10_add/; |
| 674 | 692 |
| 675 add_proto qw/void vp9_highbd_idct16x16_256_add/, "const tran_low_t *input, u
int8_t *dest, int dest_stride, int bd"; | 693 add_proto qw/void vpx_highbd_idct16x16_256_add/, "const tran_low_t *input, u
int8_t *dest, int dest_stride, int bd"; |
| 676 specialize qw/vp9_highbd_idct16x16_256_add/; | 694 specialize qw/vpx_highbd_idct16x16_256_add/; |
| 677 | 695 |
| 678 add_proto qw/void vp9_highbd_idct16x16_10_add/, "const tran_low_t *input, ui
nt8_t *dest, int dest_stride, int bd"; | 696 add_proto qw/void vpx_highbd_idct16x16_10_add/, "const tran_low_t *input, ui
nt8_t *dest, int dest_stride, int bd"; |
| 679 specialize qw/vp9_highbd_idct16x16_10_add/; | 697 specialize qw/vpx_highbd_idct16x16_10_add/; |
| 680 } else { | 698 } else { |
| 681 add_proto qw/void vp9_highbd_idct4x4_16_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; | 699 add_proto qw/void vpx_highbd_idct4x4_16_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; |
| 682 specialize qw/vp9_highbd_idct4x4_16_add sse2/; | 700 specialize qw/vpx_highbd_idct4x4_16_add sse2/; |
| 683 | 701 |
| 684 add_proto qw/void vp9_highbd_idct8x8_64_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; | 702 add_proto qw/void vpx_highbd_idct8x8_64_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; |
| 685 specialize qw/vp9_highbd_idct8x8_64_add sse2/; | 703 specialize qw/vpx_highbd_idct8x8_64_add sse2/; |
| 686 | 704 |
| 687 add_proto qw/void vp9_highbd_idct8x8_10_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; | 705 add_proto qw/void vpx_highbd_idct8x8_10_add/, "const tran_low_t *input, uint
8_t *dest, int dest_stride, int bd"; |
| 688 specialize qw/vp9_highbd_idct8x8_10_add sse2/; | 706 specialize qw/vpx_highbd_idct8x8_10_add sse2/; |
| 689 | 707 |
| 690 add_proto qw/void vp9_highbd_idct16x16_256_add/, "const tran_low_t *input, u
int8_t *dest, int dest_stride, int bd"; | 708 add_proto qw/void vpx_highbd_idct16x16_256_add/, "const tran_low_t *input, u
int8_t *dest, int dest_stride, int bd"; |
| 691 specialize qw/vp9_highbd_idct16x16_256_add sse2/; | 709 specialize qw/vpx_highbd_idct16x16_256_add sse2/; |
| 692 | 710 |
| 693 add_proto qw/void vp9_highbd_idct16x16_10_add/, "const tran_low_t *input, ui
nt8_t *dest, int dest_stride, int bd"; | 711 add_proto qw/void vpx_highbd_idct16x16_10_add/, "const tran_low_t *input, ui
nt8_t *dest, int dest_stride, int bd"; |
| 694 specialize qw/vp9_highbd_idct16x16_10_add sse2/; | 712 specialize qw/vpx_highbd_idct16x16_10_add sse2/; |
| 695 } # CONFIG_EMULATE_HARDWARE | 713 } # CONFIG_EMULATE_HARDWARE |
| 696 } else { | 714 } else { |
| 697 # Force C versions if CONFIG_EMULATE_HARDWARE is 1 | 715 # Force C versions if CONFIG_EMULATE_HARDWARE is 1 |
| 698 if (vpx_config("CONFIG_EMULATE_HARDWARE") eq "yes") { | 716 if (vpx_config("CONFIG_EMULATE_HARDWARE") eq "yes") { |
| 699 add_proto qw/void vp9_idct4x4_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; | 717 add_proto qw/void vpx_idct4x4_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; |
| 700 specialize qw/vp9_idct4x4_1_add/; | 718 specialize qw/vpx_idct4x4_1_add/; |
| 701 | 719 |
| 702 add_proto qw/void vp9_idct4x4_16_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; | 720 add_proto qw/void vpx_idct4x4_16_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; |
| 703 specialize qw/vp9_idct4x4_16_add/; | 721 specialize qw/vpx_idct4x4_16_add/; |
| 704 | 722 |
| 705 add_proto qw/void vp9_idct8x8_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; | 723 add_proto qw/void vpx_idct8x8_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; |
| 706 specialize qw/vp9_idct8x8_1_add/; | 724 specialize qw/vpx_idct8x8_1_add/; |
| 707 | 725 |
| 708 add_proto qw/void vp9_idct8x8_64_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; | 726 add_proto qw/void vpx_idct8x8_64_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; |
| 709 specialize qw/vp9_idct8x8_64_add/; | 727 specialize qw/vpx_idct8x8_64_add/; |
| 710 | 728 |
| 711 add_proto qw/void vp9_idct8x8_12_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; | 729 add_proto qw/void vpx_idct8x8_12_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; |
| 712 specialize qw/vp9_idct8x8_12_add/; | 730 specialize qw/vpx_idct8x8_12_add/; |
| 713 | 731 |
| 714 add_proto qw/void vp9_idct16x16_1_add/, "const tran_low_t *input, uint8_t *d
est, int dest_stride"; | 732 add_proto qw/void vpx_idct16x16_1_add/, "const tran_low_t *input, uint8_t *d
est, int dest_stride"; |
| 715 specialize qw/vp9_idct16x16_1_add/; | 733 specialize qw/vpx_idct16x16_1_add/; |
| 716 | 734 |
| 717 add_proto qw/void vp9_idct16x16_256_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride"; | 735 add_proto qw/void vpx_idct16x16_256_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride"; |
| 718 specialize qw/vp9_idct16x16_256_add/; | 736 specialize qw/vpx_idct16x16_256_add/; |
| 719 | 737 |
| 720 add_proto qw/void vp9_idct16x16_10_add/, "const tran_low_t *input, uint8_t *
dest, int dest_stride"; | 738 add_proto qw/void vpx_idct16x16_10_add/, "const tran_low_t *input, uint8_t *
dest, int dest_stride"; |
| 721 specialize qw/vp9_idct16x16_10_add/; | 739 specialize qw/vpx_idct16x16_10_add/; |
| 722 | 740 |
| 723 add_proto qw/void vp9_idct32x32_1024_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride"; | 741 add_proto qw/void vpx_idct32x32_1024_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride"; |
| 724 specialize qw/vp9_idct32x32_1024_add/; | 742 specialize qw/vpx_idct32x32_1024_add/; |
| 725 | 743 |
| 726 add_proto qw/void vp9_idct32x32_34_add/, "const tran_low_t *input, uint8_t *
dest, int dest_stride"; | 744 add_proto qw/void vpx_idct32x32_34_add/, "const tran_low_t *input, uint8_t *
dest, int dest_stride"; |
| 727 specialize qw/vp9_idct32x32_34_add/; | 745 specialize qw/vpx_idct32x32_34_add/; |
| 728 | 746 |
| 729 add_proto qw/void vp9_idct32x32_1_add/, "const tran_low_t *input, uint8_t *d
est, int dest_stride"; | 747 add_proto qw/void vpx_idct32x32_1_add/, "const tran_low_t *input, uint8_t *d
est, int dest_stride"; |
| 730 specialize qw/vp9_idct32x32_1_add/; | 748 specialize qw/vpx_idct32x32_1_add/; |
| 731 | 749 |
| 732 add_proto qw/void vp9_iwht4x4_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; | 750 add_proto qw/void vpx_iwht4x4_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; |
| 733 specialize qw/vp9_iwht4x4_1_add/; | 751 specialize qw/vpx_iwht4x4_1_add/; |
| 734 | 752 |
| 735 add_proto qw/void vp9_iwht4x4_16_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; | 753 add_proto qw/void vpx_iwht4x4_16_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; |
| 736 specialize qw/vp9_iwht4x4_16_add/; | 754 specialize qw/vpx_iwht4x4_16_add/; |
| 737 } else { | 755 } else { |
| 738 add_proto qw/void vp9_idct4x4_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; | 756 add_proto qw/void vpx_idct4x4_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; |
| 739 specialize qw/vp9_idct4x4_1_add sse2 neon dspr2 msa/; | 757 specialize qw/vpx_idct4x4_1_add sse2 neon dspr2 msa/; |
| 740 | 758 |
| 741 add_proto qw/void vp9_idct4x4_16_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; | 759 add_proto qw/void vpx_idct4x4_16_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; |
| 742 specialize qw/vp9_idct4x4_16_add sse2 neon dspr2 msa/; | 760 specialize qw/vpx_idct4x4_16_add sse2 neon dspr2 msa/; |
| 743 | 761 |
| 744 add_proto qw/void vp9_idct8x8_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; | 762 add_proto qw/void vpx_idct8x8_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; |
| 745 specialize qw/vp9_idct8x8_1_add sse2 neon dspr2 msa/; | 763 specialize qw/vpx_idct8x8_1_add sse2 neon dspr2 msa/; |
| 746 | 764 |
| 747 add_proto qw/void vp9_idct8x8_64_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; | 765 add_proto qw/void vpx_idct8x8_64_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; |
| 748 specialize qw/vp9_idct8x8_64_add sse2 neon dspr2 msa/, "$ssse3_x86_64_x86inc
"; | 766 specialize qw/vpx_idct8x8_64_add sse2 neon dspr2 msa/, "$ssse3_x86_64_x86inc
"; |
| 749 | 767 |
| 750 add_proto qw/void vp9_idct8x8_12_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; | 768 add_proto qw/void vpx_idct8x8_12_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; |
| 751 specialize qw/vp9_idct8x8_12_add sse2 neon dspr2 msa/, "$ssse3_x86_64_x86inc
"; | 769 specialize qw/vpx_idct8x8_12_add sse2 neon dspr2 msa/, "$ssse3_x86_64_x86inc
"; |
| 752 | 770 |
| 753 add_proto qw/void vp9_idct16x16_1_add/, "const tran_low_t *input, uint8_t *d
est, int dest_stride"; | 771 add_proto qw/void vpx_idct16x16_1_add/, "const tran_low_t *input, uint8_t *d
est, int dest_stride"; |
| 754 specialize qw/vp9_idct16x16_1_add sse2 neon dspr2 msa/; | 772 specialize qw/vpx_idct16x16_1_add sse2 neon dspr2 msa/; |
| 755 | 773 |
| 756 add_proto qw/void vp9_idct16x16_256_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride"; | 774 add_proto qw/void vpx_idct16x16_256_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride"; |
| 757 specialize qw/vp9_idct16x16_256_add sse2 neon dspr2 msa/; | 775 specialize qw/vpx_idct16x16_256_add sse2 neon dspr2 msa/; |
| 758 | 776 |
| 759 add_proto qw/void vp9_idct16x16_10_add/, "const tran_low_t *input, uint8_t *
dest, int dest_stride"; | 777 add_proto qw/void vpx_idct16x16_10_add/, "const tran_low_t *input, uint8_t *
dest, int dest_stride"; |
| 760 specialize qw/vp9_idct16x16_10_add sse2 neon dspr2 msa/; | 778 specialize qw/vpx_idct16x16_10_add sse2 neon dspr2 msa/; |
| 761 | 779 |
| 762 add_proto qw/void vp9_idct32x32_1024_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride"; | 780 add_proto qw/void vpx_idct32x32_1024_add/, "const tran_low_t *input, uint8_t
*dest, int dest_stride"; |
| 763 specialize qw/vp9_idct32x32_1024_add sse2 neon dspr2 msa/; | 781 specialize qw/vpx_idct32x32_1024_add sse2 neon dspr2 msa/; |
| 764 | 782 |
| 765 add_proto qw/void vp9_idct32x32_34_add/, "const tran_low_t *input, uint8_t *
dest, int dest_stride"; | 783 add_proto qw/void vpx_idct32x32_34_add/, "const tran_low_t *input, uint8_t *
dest, int dest_stride"; |
| 766 specialize qw/vp9_idct32x32_34_add sse2 neon_asm dspr2 msa/; | 784 specialize qw/vpx_idct32x32_34_add sse2 neon_asm dspr2 msa/; |
| 767 # Need to add 34 eob idct32x32 neon implementation. | 785 # Need to add 34 eob idct32x32 neon implementation. |
| 768 $vp9_idct32x32_34_add_neon_asm=vp9_idct32x32_1024_add_neon; | 786 $vpx_idct32x32_34_add_neon_asm=vpx_idct32x32_1024_add_neon; |
| 769 | 787 |
| 770 add_proto qw/void vp9_idct32x32_1_add/, "const tran_low_t *input, uint8_t *d
est, int dest_stride"; | 788 add_proto qw/void vpx_idct32x32_1_add/, "const tran_low_t *input, uint8_t *d
est, int dest_stride"; |
| 771 specialize qw/vp9_idct32x32_1_add sse2 neon dspr2 msa/; | 789 specialize qw/vpx_idct32x32_1_add sse2 neon dspr2 msa/; |
| 772 | 790 |
| 773 add_proto qw/void vp9_iwht4x4_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; | 791 add_proto qw/void vpx_iwht4x4_1_add/, "const tran_low_t *input, uint8_t *des
t, int dest_stride"; |
| 774 specialize qw/vp9_iwht4x4_1_add msa/; | 792 specialize qw/vpx_iwht4x4_1_add msa/; |
| 775 | 793 |
| 776 add_proto qw/void vp9_iwht4x4_16_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; | 794 add_proto qw/void vpx_iwht4x4_16_add/, "const tran_low_t *input, uint8_t *de
st, int dest_stride"; |
| 777 specialize qw/vp9_iwht4x4_16_add msa/, "$sse2_x86inc"; | 795 specialize qw/vpx_iwht4x4_16_add msa/, "$sse2_x86inc"; |
| 778 } # CONFIG_EMULATE_HARDWARE | 796 } # CONFIG_EMULATE_HARDWARE |
| 779 } # CONFIG_VP9_HIGHBITDEPTH | 797 } # CONFIG_VP9_HIGHBITDEPTH |
| 780 } # CONFIG_VP9 | 798 } # CONFIG_VP9 || CONFIG_VP10 |
| 781 | 799 |
| 782 # | 800 # |
| 783 # Quantization | 801 # Quantization |
| 784 # | 802 # |
| 785 if (vpx_config("CONFIG_VP9_ENCODER") eq "yes") { | 803 if ((vpx_config("CONFIG_VP9_ENCODER") eq "yes") || (vpx_config("CONFIG_VP10_ENCO
DER") eq "yes")) { |
| 786 if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") { | 804 if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") { |
| 787 add_proto qw/void vp9_quantize_b/, "const tran_low_t *coeff_ptr, intptr_t n_co
effs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const i
nt16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_
low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t
*scan, const int16_t *iscan"; | 805 add_proto qw/void vpx_quantize_b/, "const tran_low_t *coeff_ptr, intptr_t n_co
effs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const i
nt16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_
low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t
*scan, const int16_t *iscan"; |
| 788 specialize qw/vp9_quantize_b/; | 806 specialize qw/vpx_quantize_b/; |
| 789 | 807 |
| 790 add_proto qw/void vp9_quantize_b_32x32/, "const tran_low_t *coeff_ptr, intptr_
t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, c
onst int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr,
tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const i
nt16_t *scan, const int16_t *iscan"; | 808 add_proto qw/void vpx_quantize_b_32x32/, "const tran_low_t *coeff_ptr, intptr_
t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, c
onst int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr,
tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const i
nt16_t *scan, const int16_t *iscan"; |
| 791 specialize qw/vp9_quantize_b_32x32/; | 809 specialize qw/vpx_quantize_b_32x32/; |
| 792 | 810 |
| 793 add_proto qw/void vp9_highbd_quantize_b/, "const tran_low_t *coeff_ptr, intptr
_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr,
const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr
, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const
int16_t *scan, const int16_t *iscan"; | 811 add_proto qw/void vpx_highbd_quantize_b/, "const tran_low_t *coeff_ptr, intptr
_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr,
const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr
, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const
int16_t *scan, const int16_t *iscan"; |
| 794 specialize qw/vp9_highbd_quantize_b sse2/; | 812 specialize qw/vpx_highbd_quantize_b sse2/; |
| 795 | 813 |
| 796 add_proto qw/void vp9_highbd_quantize_b_32x32/, "const tran_low_t *coeff_ptr,
intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round
_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoe
ff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr,
const int16_t *scan, const int16_t *iscan"; | 814 add_proto qw/void vpx_highbd_quantize_b_32x32/, "const tran_low_t *coeff_ptr,
intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round
_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoe
ff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr,
const int16_t *scan, const int16_t *iscan"; |
| 797 specialize qw/vp9_highbd_quantize_b_32x32 sse2/; | 815 specialize qw/vpx_highbd_quantize_b_32x32 sse2/; |
| 798 } else { | 816 } else { |
| 799 add_proto qw/void vp9_quantize_b/, "const tran_low_t *coeff_ptr, intptr_t n_co
effs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const i
nt16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_
low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t
*scan, const int16_t *iscan"; | 817 add_proto qw/void vpx_quantize_b/, "const tran_low_t *coeff_ptr, intptr_t n_co
effs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const i
nt16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_
low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t
*scan, const int16_t *iscan"; |
| 800 specialize qw/vp9_quantize_b sse2/, "$ssse3_x86_64_x86inc"; | 818 specialize qw/vpx_quantize_b sse2/, "$ssse3_x86_64_x86inc"; |
| 801 | 819 |
| 802 add_proto qw/void vp9_quantize_b_32x32/, "const tran_low_t *coeff_ptr, intptr_
t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, c
onst int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr,
tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const i
nt16_t *scan, const int16_t *iscan"; | 820 add_proto qw/void vpx_quantize_b_32x32/, "const tran_low_t *coeff_ptr, intptr_
t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, c
onst int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr,
tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const i
nt16_t *scan, const int16_t *iscan"; |
| 803 specialize qw/vp9_quantize_b_32x32/, "$ssse3_x86_64_x86inc"; | 821 specialize qw/vpx_quantize_b_32x32/, "$ssse3_x86_64_x86inc"; |
| 804 } # CONFIG_VP9_ENCODER | |
| 805 } # CONFIG_VP9_HIGHBITDEPTH | 822 } # CONFIG_VP9_HIGHBITDEPTH |
| 823 } # CONFIG_VP9_ENCODER || CONFIG_VP10_ENCODER |
| 806 | 824 |
| 807 if (vpx_config("CONFIG_ENCODERS") eq "yes") { | 825 if (vpx_config("CONFIG_ENCODERS") eq "yes") { |
| 808 # | 826 # |
| 809 # Block subtraction | 827 # Block subtraction |
| 810 # | 828 # |
| 811 add_proto qw/void vpx_subtract_block/, "int rows, int cols, int16_t *diff_ptr, p
trdiff_t diff_stride, const uint8_t *src_ptr, ptrdiff_t src_stride, const uint8_
t *pred_ptr, ptrdiff_t pred_stride"; | 829 add_proto qw/void vpx_subtract_block/, "int rows, int cols, int16_t *diff_ptr, p
trdiff_t diff_stride, const uint8_t *src_ptr, ptrdiff_t src_stride, const uint8_
t *pred_ptr, ptrdiff_t pred_stride"; |
| 812 specialize qw/vpx_subtract_block neon msa/, "$sse2_x86inc"; | 830 specialize qw/vpx_subtract_block neon msa/, "$sse2_x86inc"; |
| 813 | 831 |
| 814 # | 832 # |
| 815 # Single block SAD | 833 # Single block SAD |
| (...skipping 167 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 983 | 1001 |
| 984 add_proto qw/void vpx_sad8x4x4d/, "const uint8_t *src_ptr, int src_stride, const
uint8_t * const ref_ptr[], int ref_stride, uint32_t *sad_array"; | 1002 add_proto qw/void vpx_sad8x4x4d/, "const uint8_t *src_ptr, int src_stride, const
uint8_t * const ref_ptr[], int ref_stride, uint32_t *sad_array"; |
| 985 specialize qw/vpx_sad8x4x4d msa/, "$sse2_x86inc"; | 1003 specialize qw/vpx_sad8x4x4d msa/, "$sse2_x86inc"; |
| 986 | 1004 |
| 987 add_proto qw/void vpx_sad4x8x4d/, "const uint8_t *src_ptr, int src_stride, const
uint8_t * const ref_ptr[], int ref_stride, uint32_t *sad_array"; | 1005 add_proto qw/void vpx_sad4x8x4d/, "const uint8_t *src_ptr, int src_stride, const
uint8_t * const ref_ptr[], int ref_stride, uint32_t *sad_array"; |
| 988 specialize qw/vpx_sad4x8x4d msa/, "$sse_x86inc"; | 1006 specialize qw/vpx_sad4x8x4d msa/, "$sse_x86inc"; |
| 989 | 1007 |
| 990 add_proto qw/void vpx_sad4x4x4d/, "const uint8_t *src_ptr, int src_stride, const
uint8_t * const ref_ptr[], int ref_stride, uint32_t *sad_array"; | 1008 add_proto qw/void vpx_sad4x4x4d/, "const uint8_t *src_ptr, int src_stride, const
uint8_t * const ref_ptr[], int ref_stride, uint32_t *sad_array"; |
| 991 specialize qw/vpx_sad4x4x4d msa/, "$sse_x86inc"; | 1009 specialize qw/vpx_sad4x4x4d msa/, "$sse_x86inc"; |
| 992 | 1010 |
| 1011 # |
| 1012 # Structured Similarity (SSIM) |
| 1013 # |
| 1014 if (vpx_config("CONFIG_INTERNAL_STATS") eq "yes") { |
| 1015 add_proto qw/void vpx_ssim_parms_8x8/, "const uint8_t *s, int sp, const uint
8_t *r, int rp, uint32_t *sum_s, uint32_t *sum_r, uint32_t *sum_sq_s, uint32_t *
sum_sq_r, uint32_t *sum_sxr"; |
| 1016 specialize qw/vpx_ssim_parms_8x8/, "$sse2_x86_64"; |
| 1017 |
| 1018 add_proto qw/void vpx_ssim_parms_16x16/, "const uint8_t *s, int sp, const ui
nt8_t *r, int rp, uint32_t *sum_s, uint32_t *sum_r, uint32_t *sum_sq_s, uint32_t
*sum_sq_r, uint32_t *sum_sxr"; |
| 1019 specialize qw/vpx_ssim_parms_16x16/, "$sse2_x86_64"; |
| 1020 } |
| 1021 |
| 993 if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") { | 1022 if (vpx_config("CONFIG_VP9_HIGHBITDEPTH") eq "yes") { |
| 994 # | 1023 # |
| 995 # Block subtraction | 1024 # Block subtraction |
| 996 # | 1025 # |
| 997 add_proto qw/void vpx_highbd_subtract_block/, "int rows, int cols, int16_t *di
ff_ptr, ptrdiff_t diff_stride, const uint8_t *src_ptr, ptrdiff_t src_stride, con
st uint8_t *pred_ptr, ptrdiff_t pred_stride, int bd"; | 1026 add_proto qw/void vpx_highbd_subtract_block/, "int rows, int cols, int16_t *di
ff_ptr, ptrdiff_t diff_stride, const uint8_t *src_ptr, ptrdiff_t src_stride, con
st uint8_t *pred_ptr, ptrdiff_t pred_stride, int bd"; |
| 998 specialize qw/vpx_highbd_subtract_block/; | 1027 specialize qw/vpx_highbd_subtract_block/; |
| 999 | 1028 |
| 1000 # | 1029 # |
| 1001 # Single block SAD | 1030 # Single block SAD |
| 1002 # | 1031 # |
| (...skipping 166 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 1169 | 1198 |
| 1170 add_proto qw/void vpx_highbd_sad8x4x4d/, "const uint8_t *src_ptr, int src_stri
de, const uint8_t* const ref_ptr[], int ref_stride, uint32_t *sad_array"; | 1199 add_proto qw/void vpx_highbd_sad8x4x4d/, "const uint8_t *src_ptr, int src_stri
de, const uint8_t* const ref_ptr[], int ref_stride, uint32_t *sad_array"; |
| 1171 specialize qw/vpx_highbd_sad8x4x4d/, "$sse2_x86inc"; | 1200 specialize qw/vpx_highbd_sad8x4x4d/, "$sse2_x86inc"; |
| 1172 | 1201 |
| 1173 add_proto qw/void vpx_highbd_sad4x8x4d/, "const uint8_t *src_ptr, int src_stri
de, const uint8_t* const ref_ptr[], int ref_stride, uint32_t *sad_array"; | 1202 add_proto qw/void vpx_highbd_sad4x8x4d/, "const uint8_t *src_ptr, int src_stri
de, const uint8_t* const ref_ptr[], int ref_stride, uint32_t *sad_array"; |
| 1174 specialize qw/vpx_highbd_sad4x8x4d/, "$sse2_x86inc"; | 1203 specialize qw/vpx_highbd_sad4x8x4d/, "$sse2_x86inc"; |
| 1175 | 1204 |
| 1176 add_proto qw/void vpx_highbd_sad4x4x4d/, "const uint8_t *src_ptr, int src_stri
de, const uint8_t* const ref_ptr[], int ref_stride, uint32_t *sad_array"; | 1205 add_proto qw/void vpx_highbd_sad4x4x4d/, "const uint8_t *src_ptr, int src_stri
de, const uint8_t* const ref_ptr[], int ref_stride, uint32_t *sad_array"; |
| 1177 specialize qw/vpx_highbd_sad4x4x4d/, "$sse2_x86inc"; | 1206 specialize qw/vpx_highbd_sad4x4x4d/, "$sse2_x86inc"; |
| 1178 | 1207 |
| 1208 # |
| 1209 # Structured Similarity (SSIM) |
| 1210 # |
| 1211 if (vpx_config("CONFIG_INTERNAL_STATS") eq "yes") { |
| 1212 add_proto qw/void vpx_highbd_ssim_parms_8x8/, "const uint16_t *s, int sp, co
nst uint16_t *r, int rp, uint32_t *sum_s, uint32_t *sum_r, uint32_t *sum_sq_s, u
int32_t *sum_sq_r, uint32_t *sum_sxr"; |
| 1213 specialize qw/vpx_highbd_ssim_parms_8x8/; |
| 1214 } |
| 1179 } # CONFIG_VP9_HIGHBITDEPTH | 1215 } # CONFIG_VP9_HIGHBITDEPTH |
| 1180 } # CONFIG_ENCODERS | 1216 } # CONFIG_ENCODERS |
| 1181 | 1217 |
| 1182 if (vpx_config("CONFIG_ENCODERS") eq "yes" || vpx_config("CONFIG_POSTPROC") eq "
yes" || vpx_config("CONFIG_VP9_POSTPROC") eq "yes") { | 1218 if (vpx_config("CONFIG_ENCODERS") eq "yes" || vpx_config("CONFIG_POSTPROC") eq "
yes" || vpx_config("CONFIG_VP9_POSTPROC") eq "yes") { |
| 1183 | 1219 |
| 1184 # | 1220 # |
| 1185 # Variance | 1221 # Variance |
| 1186 # | 1222 # |
| 1187 add_proto qw/unsigned int vpx_variance64x64/, "const uint8_t *src_ptr, int sourc
e_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; | 1223 add_proto qw/unsigned int vpx_variance64x64/, "const uint8_t *src_ptr, int sourc
e_stride, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse"; |
| 1188 specialize qw/vpx_variance64x64 sse2 avx2 neon msa/; | 1224 specialize qw/vpx_variance64x64 sse2 avx2 neon msa/; |
| (...skipping 510 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 1699 add_proto qw/uint32_t vpx_highbd_8_sub_pixel_avg_variance8x4/, "const uint8_t
*src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr,
int ref_stride, uint32_t *sse, const uint8_t *second_pred"; | 1735 add_proto qw/uint32_t vpx_highbd_8_sub_pixel_avg_variance8x4/, "const uint8_t
*src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr,
int ref_stride, uint32_t *sse, const uint8_t *second_pred"; |
| 1700 specialize qw/vpx_highbd_8_sub_pixel_avg_variance8x4/, "$sse2_x86inc"; | 1736 specialize qw/vpx_highbd_8_sub_pixel_avg_variance8x4/, "$sse2_x86inc"; |
| 1701 | 1737 |
| 1702 add_proto qw/uint32_t vpx_highbd_8_sub_pixel_avg_variance4x8/, "const uint8_t
*src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr,
int ref_stride, uint32_t *sse, const uint8_t *second_pred"; | 1738 add_proto qw/uint32_t vpx_highbd_8_sub_pixel_avg_variance4x8/, "const uint8_t
*src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr,
int ref_stride, uint32_t *sse, const uint8_t *second_pred"; |
| 1703 add_proto qw/uint32_t vpx_highbd_8_sub_pixel_avg_variance4x4/, "const uint8_t
*src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr,
int ref_stride, uint32_t *sse, const uint8_t *second_pred"; | 1739 add_proto qw/uint32_t vpx_highbd_8_sub_pixel_avg_variance4x4/, "const uint8_t
*src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr,
int ref_stride, uint32_t *sse, const uint8_t *second_pred"; |
| 1704 | 1740 |
| 1705 } # CONFIG_VP9_HIGHBITDEPTH | 1741 } # CONFIG_VP9_HIGHBITDEPTH |
| 1706 } # CONFIG_ENCODERS || CONFIG_POSTPROC || CONFIG_VP9_POSTPROC | 1742 } # CONFIG_ENCODERS || CONFIG_POSTPROC || CONFIG_VP9_POSTPROC |
| 1707 | 1743 |
| 1708 1; | 1744 1; |
| OLD | NEW |