2014-02-24 01:33:14 +01:00
sub vp9_common_forward_decls () {
print << EOF
/ *
* VP9
* /
#include "vpx/vpx_integer.h"
2014-09-30 23:29:34 +02:00
#include "vp9/common/vp9_common.h"
2014-02-24 01:33:14 +01:00
#include "vp9/common/vp9_enums.h"
struct macroblockd ;
/* Encoder forward decls */
struct macroblock ;
struct vp9_variance_vtable ;
2014-04-26 03:22:27 +02:00
struct search_site_config ;
2014-02-24 01:33:14 +01:00
struct mv ;
union int_mv ;
struct yv12_buffer_config ;
EOF
}
forward_decls qw/vp9_common_forward_decls/ ;
# x86inc.asm doesn't work if pic is enabled on 32 bit platforms so no assembly.
if ( vpx_config ( "CONFIG_USE_X86INC" ) eq "yes" ) {
$ mmx_x86inc = 'mmx' ;
$ sse_x86inc = 'sse' ;
$ sse2_x86inc = 'sse2' ;
$ ssse3_x86inc = 'ssse3' ;
$ avx_x86inc = 'avx' ;
$ avx2_x86inc = 'avx2' ;
} else {
$ mmx_x86inc = $ sse_x86inc = $ sse2_x86inc = $ ssse3_x86inc =
$ avx_x86inc = $ avx2_x86inc = '' ;
}
# this variable is for functions that are 64 bit only.
if ( $ opts { arch } eq "x86_64" ) {
$ mmx_x86_64 = 'mmx' ;
$ sse2_x86_64 = 'sse2' ;
$ ssse3_x86_64 = 'ssse3' ;
$ avx_x86_64 = 'avx' ;
$ avx2_x86_64 = 'avx2' ;
} else {
$ mmx_x86_64 = $ sse2_x86_64 = $ ssse3_x86_64 =
$ avx_x86_64 = $ avx2_x86_64 = '' ;
}
2014-09-10 19:27:58 +02:00
# optimizations which depend on multiple features
if ( ( vpx_config ( "HAVE_AVX2" ) eq "yes" ) && ( vpx_config ( "HAVE_SSSE3" ) eq "yes" ) ) {
$ avx2_ssse3 = 'avx2' ;
} else {
$ avx2_ssse3 = '' ;
}
2014-02-24 01:33:14 +01:00
#
# RECON
#
add_proto qw/void vp9_d207_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d207_predictor_4x4/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_d45_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d45_predictor_4x4/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_d63_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d63_predictor_4x4/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_h_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2014-02-08 18:01:36 +01:00
specialize qw/vp9_h_predictor_4x4 neon dspr2/ , "$ssse3_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_d117_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d117_predictor_4x4/ ;
add_proto qw/void vp9_d135_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d135_predictor_4x4/ ;
add_proto qw/void vp9_d153_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d153_predictor_4x4/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_v_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2014-02-08 18:01:36 +01:00
specialize qw/vp9_v_predictor_4x4 neon/ , "$sse_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_tm_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2014-02-08 18:01:36 +01:00
specialize qw/vp9_tm_predictor_4x4 neon dspr2/ , "$sse_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_dc_predictor_4x4 dspr2/ , "$sse_x86inc" ;
add_proto qw/void vp9_dc_top_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-01 00:42:57 +02:00
specialize qw/vp9_dc_top_predictor_4x4/ , "$sse_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_left_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-01 00:42:57 +02:00
specialize qw/vp9_dc_left_predictor_4x4/ , "$sse_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_128_predictor_4x4/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-01 00:42:57 +02:00
specialize qw/vp9_dc_128_predictor_4x4/ , "$sse_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_d207_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d207_predictor_8x8/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_d45_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d45_predictor_8x8/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_d63_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d63_predictor_8x8/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_h_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2014-02-08 18:01:36 +01:00
specialize qw/vp9_h_predictor_8x8 neon dspr2/ , "$ssse3_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_d117_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d117_predictor_8x8/ ;
add_proto qw/void vp9_d135_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d135_predictor_8x8/ ;
add_proto qw/void vp9_d153_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d153_predictor_8x8/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_v_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2014-02-08 18:01:36 +01:00
specialize qw/vp9_v_predictor_8x8 neon/ , "$sse_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_tm_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2014-02-08 18:01:36 +01:00
specialize qw/vp9_tm_predictor_8x8 neon dspr2/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-28 03:59:57 +02:00
specialize qw/vp9_dc_predictor_8x8 dspr2 neon/ , "$sse_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_top_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-28 03:59:57 +02:00
specialize qw/vp9_dc_top_predictor_8x8 neon/ , "$sse_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_left_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-28 03:59:57 +02:00
specialize qw/vp9_dc_left_predictor_8x8 neon/ , "$sse_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_128_predictor_8x8/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-28 03:59:57 +02:00
specialize qw/vp9_dc_128_predictor_8x8 neon/ , "$sse_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_d207_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d207_predictor_16x16/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_d45_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d45_predictor_16x16/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_d63_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d63_predictor_16x16/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_h_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2014-02-08 18:01:36 +01:00
specialize qw/vp9_h_predictor_16x16 neon dspr2/ , "$ssse3_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_d117_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d117_predictor_16x16/ ;
add_proto qw/void vp9_d135_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d135_predictor_16x16/ ;
add_proto qw/void vp9_d153_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d153_predictor_16x16/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_v_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2014-02-08 18:01:36 +01:00
specialize qw/vp9_v_predictor_16x16 neon/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_tm_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2014-02-08 18:01:36 +01:00
specialize qw/vp9_tm_predictor_16x16 neon/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-28 05:17:27 +02:00
specialize qw/vp9_dc_predictor_16x16 dspr2 neon/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_top_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-28 05:17:27 +02:00
specialize qw/vp9_dc_top_predictor_16x16 neon/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_left_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-28 05:17:27 +02:00
specialize qw/vp9_dc_left_predictor_16x16 neon/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_128_predictor_16x16/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-28 05:17:27 +02:00
specialize qw/vp9_dc_128_predictor_16x16 neon/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_d207_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d207_predictor_32x32/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_d45_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d45_predictor_32x32/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_d63_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d63_predictor_32x32/ , "$ssse3_x86inc" ;
add_proto qw/void vp9_h_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2014-02-08 18:01:36 +01:00
specialize qw/vp9_h_predictor_32x32 neon/ , "$ssse3_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_d117_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d117_predictor_32x32/ ;
add_proto qw/void vp9_d135_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d135_predictor_32x32/ ;
add_proto qw/void vp9_d153_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_d153_predictor_32x32/ ;
add_proto qw/void vp9_v_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2014-02-08 18:01:36 +01:00
specialize qw/vp9_v_predictor_32x32 neon/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_tm_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2014-02-08 18:01:36 +01:00
specialize qw/vp9_tm_predictor_32x32 neon/ , "$sse2_x86_64" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
specialize qw/vp9_dc_predictor_32x32/ , "$sse2_x86inc" ;
add_proto qw/void vp9_dc_top_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-06 00:21:28 +02:00
specialize qw/vp9_dc_top_predictor_32x32/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_left_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-06 00:21:28 +02:00
specialize qw/vp9_dc_left_predictor_32x32/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_dc_128_predictor_32x32/ , "uint8_t *dst, ptrdiff_t y_stride, const uint8_t *above, const uint8_t *left" ;
2015-05-06 00:21:28 +02:00
specialize qw/vp9_dc_128_predictor_32x32/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
#
# Loopfilter
#
add_proto qw/void vp9_lpf_vertical_16/ , "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh" ;
2015-06-04 08:20:41 +02:00
specialize qw/vp9_lpf_vertical_16 sse2 neon_asm dspr2 msa/ ;
2014-05-07 20:01:31 +02:00
$ vp9_lpf_vertical_16_neon_asm = vp9_lpf_vertical_16_neon ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_lpf_vertical_16_dual/ , "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh" ;
2015-06-04 08:20:41 +02:00
specialize qw/vp9_lpf_vertical_16_dual sse2 neon_asm dspr2 msa/ ;
2014-05-07 20:01:31 +02:00
$ vp9_lpf_vertical_16_dual_neon_asm = vp9_lpf_vertical_16_dual_neon ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_lpf_vertical_8/ , "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count" ;
2014-12-20 00:00:04 +01:00
specialize qw/vp9_lpf_vertical_8 sse2 neon_asm dspr2/ ;
$ vp9_lpf_vertical_8_neon_asm = vp9_lpf_vertical_8_neon ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_lpf_vertical_8_dual/ , "uint8_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1" ;
2014-12-20 00:00:04 +01:00
specialize qw/vp9_lpf_vertical_8_dual sse2 neon_asm dspr2/ ;
$ vp9_lpf_vertical_8_dual_neon_asm = vp9_lpf_vertical_8_dual_neon ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_lpf_vertical_4/ , "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count" ;
2014-01-21 02:43:29 +01:00
specialize qw/vp9_lpf_vertical_4 mmx neon dspr2/ ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_lpf_vertical_4_dual/ , "uint8_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1" ;
2014-01-21 02:43:29 +01:00
specialize qw/vp9_lpf_vertical_4_dual sse2 neon dspr2/ ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_lpf_horizontal_16/ , "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count" ;
2015-06-04 08:20:41 +02:00
specialize qw/vp9_lpf_horizontal_16 sse2 avx2 neon_asm dspr2 msa/ ;
2014-05-07 20:01:31 +02:00
$ vp9_lpf_horizontal_16_neon_asm = vp9_lpf_horizontal_16_neon ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_lpf_horizontal_8/ , "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count" ;
2014-12-20 00:00:04 +01:00
specialize qw/vp9_lpf_horizontal_8 sse2 neon_asm dspr2/ ;
$ vp9_lpf_horizontal_8_neon_asm = vp9_lpf_horizontal_8_neon ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_lpf_horizontal_8_dual/ , "uint8_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1" ;
2014-12-20 00:00:04 +01:00
specialize qw/vp9_lpf_horizontal_8_dual sse2 neon_asm dspr2/ ;
$ vp9_lpf_horizontal_8_dual_neon_asm = vp9_lpf_horizontal_8_dual_neon ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_lpf_horizontal_4/ , "uint8_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count" ;
2014-01-21 02:43:29 +01:00
specialize qw/vp9_lpf_horizontal_4 mmx neon dspr2/ ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_lpf_horizontal_4_dual/ , "uint8_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1" ;
2014-02-08 05:06:21 +01:00
specialize qw/vp9_lpf_horizontal_4_dual sse2 neon dspr2/ ;
2014-02-24 01:33:14 +01:00
#
# post proc
#
if ( vpx_config ( "CONFIG_VP9_POSTPROC" ) eq "yes" ) {
add_proto qw/void vp9_mbpost_proc_down/ , "uint8_t *dst, int pitch, int rows, int cols, int flimit" ;
2014-09-05 20:52:24 +02:00
specialize qw/vp9_mbpost_proc_down sse2/ ;
2014-02-24 01:33:14 +01:00
$ vp9_mbpost_proc_down_sse2 = vp9_mbpost_proc_down_xmm ;
add_proto qw/void vp9_mbpost_proc_across_ip/ , "uint8_t *src, int pitch, int rows, int cols, int flimit" ;
specialize qw/vp9_mbpost_proc_across_ip sse2/ ;
$ vp9_mbpost_proc_across_ip_sse2 = vp9_mbpost_proc_across_ip_xmm ;
add_proto qw/void vp9_post_proc_down_and_across/ , "const uint8_t *src_ptr, uint8_t *dst_ptr, int src_pixels_per_line, int dst_pixels_per_line, int rows, int cols, int flimit" ;
2014-09-05 20:52:24 +02:00
specialize qw/vp9_post_proc_down_and_across sse2/ ;
2014-02-24 01:33:14 +01:00
$ vp9_post_proc_down_and_across_sse2 = vp9_post_proc_down_and_across_xmm ;
add_proto qw/void vp9_plane_add_noise/ , "uint8_t *Start, char *noise, char blackclamp[16], char whiteclamp[16], char bothclamp[16], unsigned int Width, unsigned int Height, int Pitch" ;
2014-09-05 20:52:24 +02:00
specialize qw/vp9_plane_add_noise sse2/ ;
2014-02-24 01:33:14 +01:00
$ vp9_plane_add_noise_sse2 = vp9_plane_add_noise_wmt ;
2015-01-13 19:50:50 +01:00
add_proto qw/void vp9_filter_by_weight16x16/ , "const uint8_t *src, int src_stride, uint8_t *dst, int dst_stride, int src_weight" ;
specialize qw/vp9_filter_by_weight16x16 sse2/ ;
add_proto qw/void vp9_filter_by_weight8x8/ , "const uint8_t *src, int src_stride, uint8_t *dst, int dst_stride, int src_weight" ;
specialize qw/vp9_filter_by_weight8x8 sse2/ ;
2014-02-24 01:33:14 +01:00
}
#
# Sub Pixel Filters
#
add_proto qw/void vp9_convolve_copy/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h" ;
2015-06-02 06:59:56 +02:00
specialize qw/vp9_convolve_copy neon dspr2 msa/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_convolve_avg/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h" ;
2015-06-02 06:59:56 +02:00
specialize qw/vp9_convolve_avg neon dspr2 msa/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_convolve8/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h" ;
2015-06-02 06:59:56 +02:00
specialize qw/vp9_convolve8 sse2 ssse3 neon dspr2 msa/ , "$avx2_ssse3" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_convolve8_horiz/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h" ;
2015-06-02 06:59:56 +02:00
specialize qw/vp9_convolve8_horiz sse2 ssse3 neon dspr2 msa/ , "$avx2_ssse3" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_convolve8_vert/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h" ;
2015-06-02 06:59:56 +02:00
specialize qw/vp9_convolve8_vert sse2 ssse3 neon dspr2 msa/ , "$avx2_ssse3" ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_convolve8_avg/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h" ;
2015-06-04 04:41:01 +02:00
specialize qw/vp9_convolve8_avg sse2 ssse3 neon dspr2 msa/ ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_convolve8_avg_horiz/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h" ;
2015-06-03 08:03:42 +02:00
specialize qw/vp9_convolve8_avg_horiz sse2 ssse3 neon dspr2 msa/ ;
2014-02-24 01:33:14 +01:00
add_proto qw/void vp9_convolve8_avg_vert/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h" ;
2015-06-03 06:25:25 +02:00
specialize qw/vp9_convolve8_avg_vert sse2 ssse3 neon dspr2 msa/ ;
2014-02-24 01:33:14 +01:00
#
# dct
#
2014-09-03 01:34:09 +02:00
if ( vpx_config ( "CONFIG_VP9_HIGHBITDEPTH" ) eq "yes" ) {
2014-10-03 00:43:27 +02:00
# Note as optimized versions of these functions are added we need to add a check to ensure
# that when CONFIG_EMULATE_HARDWARE is on, it defaults to the C versions only.
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_idct4x4_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct4x4_1_add/ ;
add_proto qw/void vp9_idct4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct4x4_16_add/ ;
add_proto qw/void vp9_idct8x8_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct8x8_1_add/ ;
add_proto qw/void vp9_idct8x8_64_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct8x8_64_add/ ;
add_proto qw/void vp9_idct8x8_12_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct8x8_12_add/ ;
add_proto qw/void vp9_idct16x16_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct16x16_1_add/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_idct16x16_256_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct16x16_256_add/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_idct16x16_10_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct16x16_10_add/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_idct32x32_1024_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct32x32_1024_add/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_idct32x32_34_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct32x32_34_add/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_idct32x32_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct32x32_1_add/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_iht4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type" ;
specialize qw/vp9_iht4x4_16_add/ ;
add_proto qw/void vp9_iht8x8_64_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type" ;
specialize qw/vp9_iht8x8_64_add/ ;
add_proto qw/void vp9_iht16x16_256_add/ , "const tran_low_t *input, uint8_t *output, int pitch, int tx_type" ;
specialize qw/vp9_iht16x16_256_add/ ;
# dct and add
add_proto qw/void vp9_iwht4x4_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_iwht4x4_1_add/ ;
add_proto qw/void vp9_iwht4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_iwht4x4_16_add/ ;
2014-10-03 00:43:27 +02:00
2014-09-03 01:34:09 +02:00
} else {
2014-10-03 00:43:27 +02:00
# Force C versions if CONFIG_EMULATE_HARDWARE is 1
if ( vpx_config ( "CONFIG_EMULATE_HARDWARE" ) eq "yes" ) {
add_proto qw/void vp9_idct4x4_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct4x4_1_add/ ;
2014-02-24 01:33:14 +01:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct4x4_16_add/ ;
2014-02-24 01:33:14 +01:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct8x8_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct8x8_1_add/ ;
2014-02-24 01:33:14 +01:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct8x8_64_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct8x8_64_add/ ;
2014-02-24 01:33:14 +01:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct8x8_12_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct8x8_12_add/ ;
2014-02-24 01:33:14 +01:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct16x16_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct16x16_1_add/ ;
2014-02-24 01:33:14 +01:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct16x16_256_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct16x16_256_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct16x16_10_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct16x16_10_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct32x32_1024_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct32x32_1024_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct32x32_34_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct32x32_34_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct32x32_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_idct32x32_1_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_iht4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type" ;
specialize qw/vp9_iht4x4_16_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_iht8x8_64_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type" ;
specialize qw/vp9_iht8x8_64_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_iht16x16_256_add/ , "const tran_low_t *input, uint8_t *output, int pitch, int tx_type" ;
specialize qw/vp9_iht16x16_256_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-03 00:43:27 +02:00
# dct and add
2014-09-03 01:34:09 +02:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_iwht4x4_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_iwht4x4_1_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_iwht4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
specialize qw/vp9_iwht4x4_16_add/ ;
} else {
add_proto qw/void vp9_idct4x4_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-02 08:46:28 +02:00
specialize qw/vp9_idct4x4_1_add sse2 neon dspr2 msa/ ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-02 08:46:28 +02:00
specialize qw/vp9_idct4x4_16_add sse2 neon dspr2 msa/ ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct8x8_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-01 05:49:01 +02:00
specialize qw/vp9_idct8x8_1_add sse2 neon dspr2 msa/ ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct8x8_64_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-01 05:49:01 +02:00
specialize qw/vp9_idct8x8_64_add sse2 neon dspr2 msa/ , "$ssse3_x86_64" ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct8x8_12_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-01 05:49:01 +02:00
specialize qw/vp9_idct8x8_12_add sse2 neon dspr2 msa/ , "$ssse3_x86_64" ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct16x16_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-01 05:49:01 +02:00
specialize qw/vp9_idct16x16_1_add sse2 neon dspr2 msa/ ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct16x16_256_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-01 05:49:01 +02:00
specialize qw/vp9_idct16x16_256_add sse2 neon dspr2 msa/ ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct16x16_10_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-01 05:49:01 +02:00
specialize qw/vp9_idct16x16_10_add sse2 neon dspr2 msa/ ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct32x32_1024_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-01 05:49:01 +02:00
specialize qw/vp9_idct32x32_1024_add sse2 neon dspr2 msa/ ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_idct32x32_34_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-01 05:49:01 +02:00
specialize qw/vp9_idct32x32_34_add sse2 neon_asm dspr2 msa/ ;
2014-02-18 14:56:46 +01:00
#is this a typo?
2014-10-03 00:43:27 +02:00
$ vp9_idct32x32_34_add_neon_asm = vp9_idct32x32_1024_add_neon ;
add_proto qw/void vp9_idct32x32_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-01 05:49:01 +02:00
specialize qw/vp9_idct32x32_1_add sse2 neon dspr2 msa/ ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_iht4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type" ;
2015-06-02 08:46:28 +02:00
specialize qw/vp9_iht4x4_16_add sse2 neon dspr2 msa/ ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_iht8x8_64_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type" ;
2015-06-01 05:49:01 +02:00
specialize qw/vp9_iht8x8_64_add sse2 neon dspr2 msa/ ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_iht16x16_256_add/ , "const tran_low_t *input, uint8_t *output, int pitch, int tx_type" ;
2015-06-01 05:49:01 +02:00
specialize qw/vp9_iht16x16_256_add sse2 dspr2 msa/ ;
2014-10-03 00:43:27 +02:00
# dct and add
add_proto qw/void vp9_iwht4x4_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-02 08:46:28 +02:00
specialize qw/vp9_iwht4x4_1_add msa/ ;
2014-10-03 00:43:27 +02:00
add_proto qw/void vp9_iwht4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride" ;
2015-06-02 08:46:28 +02:00
specialize qw/vp9_iwht4x4_16_add msa/ ;
2014-10-03 00:43:27 +02:00
}
2014-09-03 01:34:09 +02:00
}
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
# High bitdepth functions
if ( vpx_config ( "CONFIG_VP9_HIGHBITDEPTH" ) eq "yes" ) {
2014-09-15 21:59:19 +02:00
#
# Intra prediction
#
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d207_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d207_predictor_4x4/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d45_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d45_predictor_4x4/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d63_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d63_predictor_4x4/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_h_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_h_predictor_4x4/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d117_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d117_predictor_4x4/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d135_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d135_predictor_4x4/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d153_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d153_predictor_4x4/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_v_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
2015-04-01 02:45:25 +02:00
specialize qw/vp9_highbd_v_predictor_4x4/ , "$sse_x86inc" ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_tm_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_tm_predictor_4x4/ , "$sse_x86inc" ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_predictor_4x4/ , "$sse_x86inc" ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_top_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_top_predictor_4x4/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_left_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_left_predictor_4x4/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_128_predictor_4x4/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_128_predictor_4x4/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d207_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d207_predictor_8x8/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d45_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d45_predictor_8x8/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d63_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d63_predictor_8x8/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_h_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_h_predictor_8x8/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d117_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d117_predictor_8x8/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d135_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d135_predictor_8x8/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d153_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d153_predictor_8x8/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_v_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_v_predictor_8x8/ , "$sse2_x86inc" ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_tm_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_tm_predictor_8x8/ , "$sse2_x86inc" ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_predictor_8x8/ , "$sse2_x86inc" ; ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_top_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_top_predictor_8x8/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_left_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_left_predictor_8x8/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_128_predictor_8x8/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_128_predictor_8x8/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d207_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d207_predictor_16x16/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d45_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d45_predictor_16x16/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d63_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d63_predictor_16x16/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_h_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_h_predictor_16x16/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d117_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d117_predictor_16x16/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d135_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d135_predictor_16x16/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d153_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d153_predictor_16x16/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_v_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
2015-04-01 02:45:25 +02:00
specialize qw/vp9_highbd_v_predictor_16x16/ , "$sse2_x86inc" ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_tm_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_tm_predictor_16x16/ , "$sse2_x86_64" ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_predictor_16x16/ , "$sse2_x86inc" ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_top_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_top_predictor_16x16/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_left_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_left_predictor_16x16/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_128_predictor_16x16/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_128_predictor_16x16/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d207_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d207_predictor_32x32/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d45_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d45_predictor_32x32/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d63_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d63_predictor_32x32/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_h_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_h_predictor_32x32/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d117_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d117_predictor_32x32/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d135_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d135_predictor_32x32/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_d153_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_d153_predictor_32x32/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_v_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_v_predictor_32x32/ , "$sse2_x86inc" ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_tm_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_tm_predictor_32x32/ , "$sse2_x86_64" ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_predictor_32x32/ , "$sse2_x86_64" ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_top_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_top_predictor_32x32/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_left_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_left_predictor_32x32/ ;
2014-09-15 21:59:19 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_dc_128_predictor_32x32/ , "uint16_t *dst, ptrdiff_t y_stride, const uint16_t *above, const uint16_t *left, int bd" ;
specialize qw/vp9_highbd_dc_128_predictor_32x32/ ;
2014-09-15 21:59:19 +02:00
2014-09-16 21:47:18 +02:00
#
# Sub Pixel Filters
#
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_convolve_copy/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps" ;
specialize qw/vp9_highbd_convolve_copy/ ;
2014-09-16 21:47:18 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_convolve_avg/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps" ;
specialize qw/vp9_highbd_convolve_avg/ ;
2014-09-16 21:47:18 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_convolve8/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps" ;
specialize qw/vp9_highbd_convolve8/ , "$sse2_x86_64" ;
2014-09-16 21:47:18 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_convolve8_horiz/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps" ;
specialize qw/vp9_highbd_convolve8_horiz/ , "$sse2_x86_64" ;
2014-09-16 21:47:18 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_convolve8_vert/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps" ;
specialize qw/vp9_highbd_convolve8_vert/ , "$sse2_x86_64" ;
2014-09-16 21:47:18 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_convolve8_avg/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps" ;
specialize qw/vp9_highbd_convolve8_avg/ , "$sse2_x86_64" ;
2014-09-16 21:47:18 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_convolve8_avg_horiz/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps" ;
specialize qw/vp9_highbd_convolve8_avg_horiz/ , "$sse2_x86_64" ;
2014-09-16 21:47:18 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_convolve8_avg_vert/ , "const uint8_t *src, ptrdiff_t src_stride, uint8_t *dst, ptrdiff_t dst_stride, const int16_t *filter_x, int x_step_q4, const int16_t *filter_y, int y_step_q4, int w, int h, int bps" ;
specialize qw/vp9_highbd_convolve8_avg_vert/ , "$sse2_x86_64" ;
2014-09-16 21:47:18 +02:00
2014-09-18 01:55:05 +02:00
#
# Loopfilter
#
add_proto qw/void vp9_highbd_lpf_vertical_16/ , "uint16_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int bd" ;
specialize qw/vp9_highbd_lpf_vertical_16 sse2/ ;
add_proto qw/void vp9_highbd_lpf_vertical_16_dual/ , "uint16_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int bd" ;
specialize qw/vp9_highbd_lpf_vertical_16_dual sse2/ ;
add_proto qw/void vp9_highbd_lpf_vertical_8/ , "uint16_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count, int bd" ;
specialize qw/vp9_highbd_lpf_vertical_8 sse2/ ;
add_proto qw/void vp9_highbd_lpf_vertical_8_dual/ , "uint16_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1, int bd" ;
specialize qw/vp9_highbd_lpf_vertical_8_dual sse2/ ;
add_proto qw/void vp9_highbd_lpf_vertical_4/ , "uint16_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count, int bd" ;
specialize qw/vp9_highbd_lpf_vertical_4 sse2/ ;
add_proto qw/void vp9_highbd_lpf_vertical_4_dual/ , "uint16_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1, int bd" ;
specialize qw/vp9_highbd_lpf_vertical_4_dual sse2/ ;
add_proto qw/void vp9_highbd_lpf_horizontal_16/ , "uint16_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count, int bd" ;
specialize qw/vp9_highbd_lpf_horizontal_16 sse2/ ;
add_proto qw/void vp9_highbd_lpf_horizontal_8/ , "uint16_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count, int bd" ;
specialize qw/vp9_highbd_lpf_horizontal_8 sse2/ ;
add_proto qw/void vp9_highbd_lpf_horizontal_8_dual/ , "uint16_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1, int bd" ;
specialize qw/vp9_highbd_lpf_horizontal_8_dual sse2/ ;
add_proto qw/void vp9_highbd_lpf_horizontal_4/ , "uint16_t *s, int pitch, const uint8_t *blimit, const uint8_t *limit, const uint8_t *thresh, int count, int bd" ;
specialize qw/vp9_highbd_lpf_horizontal_4 sse2/ ;
add_proto qw/void vp9_highbd_lpf_horizontal_4_dual/ , "uint16_t *s, int pitch, const uint8_t *blimit0, const uint8_t *limit0, const uint8_t *thresh0, const uint8_t *blimit1, const uint8_t *limit1, const uint8_t *thresh1, int bd" ;
specialize qw/vp9_highbd_lpf_horizontal_4_dual sse2/ ;
#
# post proc
#
if ( vpx_config ( "CONFIG_VP9_POSTPROC" ) eq "yes" ) {
add_proto qw/void vp9_highbd_mbpost_proc_down/ , "uint16_t *dst, int pitch, int rows, int cols, int flimit" ;
specialize qw/vp9_highbd_mbpost_proc_down/ ;
add_proto qw/void vp9_highbd_mbpost_proc_across_ip/ , "uint16_t *src, int pitch, int rows, int cols, int flimit" ;
specialize qw/vp9_highbd_mbpost_proc_across_ip/ ;
add_proto qw/void vp9_highbd_post_proc_down_and_across/ , "const uint16_t *src_ptr, uint16_t *dst_ptr, int src_pixels_per_line, int dst_pixels_per_line, int rows, int cols, int flimit" ;
specialize qw/vp9_highbd_post_proc_down_and_across/ ;
add_proto qw/void vp9_highbd_plane_add_noise/ , "uint8_t *Start, char *noise, char blackclamp[16], char whiteclamp[16], char bothclamp[16], unsigned int Width, unsigned int Height, int Pitch" ;
specialize qw/vp9_highbd_plane_add_noise/ ;
}
2014-09-03 01:34:09 +02:00
#
# dct
#
2014-10-03 00:43:27 +02:00
# Note as optimized versions of these functions are added we need to add a check to ensure
# that when CONFIG_EMULATE_HARDWARE is on, it defaults to the C versions only.
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_idct4x4_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct4x4_1_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_idct8x8_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct8x8_1_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_idct16x16_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct16x16_1_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_idct32x32_1024_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct32x32_1024_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_idct32x32_34_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct32x32_34_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_idct32x32_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct32x32_1_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_iht4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type, int bd" ;
specialize qw/vp9_highbd_iht4x4_16_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_iht8x8_64_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type, int bd" ;
specialize qw/vp9_highbd_iht8x8_64_add/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_iht16x16_256_add/ , "const tran_low_t *input, uint8_t *output, int pitch, int tx_type, int bd" ;
specialize qw/vp9_highbd_iht16x16_256_add/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
# dct and add
2014-02-24 01:33:14 +01:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_iwht4x4_1_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_iwht4x4_1_add/ ;
2014-02-24 01:33:14 +01:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_iwht4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_iwht4x4_16_add/ ;
2014-10-24 09:48:02 +02:00
# Force C versions if CONFIG_EMULATE_HARDWARE is 1
if ( vpx_config ( "CONFIG_EMULATE_HARDWARE" ) eq "yes" ) {
add_proto qw/void vp9_highbd_idct4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct4x4_16_add/ ;
add_proto qw/void vp9_highbd_idct8x8_64_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct8x8_64_add/ ;
add_proto qw/void vp9_highbd_idct8x8_10_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct8x8_10_add/ ;
add_proto qw/void vp9_highbd_idct16x16_256_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct16x16_256_add/ ;
add_proto qw/void vp9_highbd_idct16x16_10_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct16x16_10_add/ ;
} else {
add_proto qw/void vp9_highbd_idct4x4_16_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct4x4_16_add sse2/ ;
add_proto qw/void vp9_highbd_idct8x8_64_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct8x8_64_add sse2/ ;
add_proto qw/void vp9_highbd_idct8x8_10_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct8x8_10_add sse2/ ;
add_proto qw/void vp9_highbd_idct16x16_256_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct16x16_256_add sse2/ ;
add_proto qw/void vp9_highbd_idct16x16_10_add/ , "const tran_low_t *input, uint8_t *dest, int dest_stride, int bd" ;
specialize qw/vp9_highbd_idct16x16_10_add sse2/ ;
}
2014-09-03 01:34:09 +02:00
}
2014-02-24 01:33:14 +01:00
#
# Encoder functions below this point.
#
if ( vpx_config ( "CONFIG_VP9_ENCODER" ) eq "yes" ) {
# variance
add_proto qw/unsigned int vp9_sub_pixel_variance64x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2015-01-14 08:01:06 +01:00
specialize qw/vp9_sub_pixel_variance64x64 avx2 neon/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/unsigned int vp9_sub_pixel_avg_variance64x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-07-24 09:20:19 +02:00
specialize qw/vp9_sub_pixel_avg_variance64x64 avx2/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/unsigned int vp9_sub_pixel_variance32x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_sub_pixel_variance32x64/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_avg_variance32x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_sub_pixel_avg_variance32x64/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_variance64x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_sub_pixel_variance64x32/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_avg_variance64x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_sub_pixel_avg_variance64x32/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_variance32x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_sub_pixel_variance32x16/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_avg_variance32x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_sub_pixel_avg_variance32x16/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_variance16x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_sub_pixel_variance16x32/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_avg_variance16x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_sub_pixel_avg_variance16x32/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_variance32x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-07-24 09:20:19 +02:00
specialize qw/vp9_sub_pixel_variance32x32 avx2 neon/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/unsigned int vp9_sub_pixel_avg_variance32x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-07-24 09:20:19 +02:00
specialize qw/vp9_sub_pixel_avg_variance32x32 avx2/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/unsigned int vp9_sub_pixel_variance16x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-07-30 01:47:34 +02:00
specialize qw/vp9_sub_pixel_variance16x16 neon/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/unsigned int vp9_sub_pixel_avg_variance16x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_sub_pixel_avg_variance16x16/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_variance8x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_sub_pixel_variance8x16/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_avg_variance8x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_sub_pixel_avg_variance8x16/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_variance16x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_sub_pixel_variance16x8/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_avg_variance16x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_sub_pixel_avg_variance16x8/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_variance8x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-08-01 20:35:55 +02:00
specialize qw/vp9_sub_pixel_variance8x8 neon/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
2014-02-24 01:33:14 +01:00
add_proto qw/unsigned int vp9_sub_pixel_avg_variance8x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_sub_pixel_avg_variance8x8/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
# TODO(jingning): need to convert 8x4/4x8 functions into mmx/sse form
add_proto qw/unsigned int vp9_sub_pixel_variance8x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_sub_pixel_variance8x4/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_avg_variance8x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_sub_pixel_avg_variance8x4/ , "$sse2_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_variance4x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_sub_pixel_variance4x8/ , "$sse_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_avg_variance4x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_sub_pixel_avg_variance4x8/ , "$sse_x86inc" , "$ssse3_x86inc" ;
add_proto qw/unsigned int vp9_sub_pixel_variance4x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_sub_pixel_variance4x4/ , "$sse_x86inc" , "$ssse3_x86inc" ;
#vp9_sub_pixel_variance4x4_sse2=vp9_sub_pixel_variance4x4_wmt
add_proto qw/unsigned int vp9_sub_pixel_avg_variance4x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_sub_pixel_avg_variance4x4/ , "$sse_x86inc" , "$ssse3_x86inc" ;
2014-10-08 01:36:14 +02:00
add_proto qw/unsigned int vp9_avg_8x8/ , "const uint8_t *, int p" ;
2015-01-15 23:36:41 +01:00
specialize qw/vp9_avg_8x8 sse2 neon/ ;
2014-10-08 01:36:14 +02:00
2014-11-12 23:51:49 +01:00
add_proto qw/unsigned int vp9_avg_4x4/ , "const uint8_t *, int p" ;
specialize qw/vp9_avg_4x4 sse2/ ;
2015-04-16 02:48:20 +02:00
add_proto qw/void vp9_minmax_8x8/ , "const uint8_t *s, int p, const uint8_t *d, int dp, int *min, int *max" ;
specialize qw/vp9_minmax_8x8 sse2/ ;
2015-03-23 18:02:42 +01:00
add_proto qw/void vp9_hadamard_8x8/ , "int16_t const *src_diff, int src_stride, int16_t *coeff" ;
2015-04-04 18:48:18 +02:00
specialize qw/vp9_hadamard_8x8 sse2/ , "$ssse3_x86_64" ;
2015-03-23 18:02:42 +01:00
2015-03-30 21:31:46 +02:00
add_proto qw/void vp9_hadamard_16x16/ , "int16_t const *src_diff, int src_stride, int16_t *coeff" ;
specialize qw/vp9_hadamard_16x16 sse2/ ;
2015-03-23 18:02:42 +01:00
add_proto qw/int16_t vp9_satd/ , "const int16_t *coeff, int length" ;
specialize qw/vp9_satd sse2/ ;
Integral projection based motion estimation
This commit introduces a new block match motion estimation
using integral projection measurement. The 2-D block and the nearby
region is projected onto the horizontal and vertical 1-D vectors,
respectively. It then runs vector match, instead of block match,
over the two separate 1-D vectors to locate the motion compensated
reference block.
This process is run per 64x64 block to align the reference before
choosing partitioning in speed 6. The overall CPU cycle cost due
to this additional 64x64 block match (SSE2 version) takes around 2%
at low bit-rate rtc speed 6. When strong motion activities exist in
the video sequence, it substantially improves the partition
selection accuracy, thereby achieving better compression performance
and lower CPU cycles.
The experiments were tested in RTC speed -6 setting:
cloud 1080p 500 kbps
17006 b/f, 37.086 dB, 5386 ms ->
16669 b/f, 37.970 dB, 5085 ms (>0.9dB gain and 6% faster)
pedestrian_area 1080p 500 kbps
53537 b/f, 36.771 dB, 18706 ms ->
51897 b/f, 36.792 dB, 18585 ms (4% bit-rate savings)
blue_sky 1080p 500 kbps
70214 b/f, 33.600 dB, 13979 ms ->
53885 b/f, 33.645 dB, 10878 ms (30% bit-rate savings, 25% faster)
jimred 400 kbps
13380 b/f, 36.014 dB, 5723 ms ->
13377 b/f, 36.087 dB, 5831 ms (2% bit-rate savings, 2% slower)
Change-Id: Iffdb6ea5b16b77016bfa3dd3904d284168ae649c
2015-02-13 20:23:45 +01:00
add_proto qw/void vp9_int_pro_row/ , "int16_t *hbuf, uint8_t const *ref, const int ref_stride, const int height" ;
specialize qw/vp9_int_pro_row sse2/ ;
add_proto qw/int16_t vp9_int_pro_col/ , "uint8_t const *ref, const int width" ;
specialize qw/vp9_int_pro_col sse2/ ;
2015-02-27 22:35:22 +01:00
add_proto qw/int vp9_vector_var/ , "int16_t const *ref, int16_t const *src, const int bwl" ;
specialize qw/vp9_vector_var sse2/ ;
Integral projection based motion estimation
This commit introduces a new block match motion estimation
using integral projection measurement. The 2-D block and the nearby
region is projected onto the horizontal and vertical 1-D vectors,
respectively. It then runs vector match, instead of block match,
over the two separate 1-D vectors to locate the motion compensated
reference block.
This process is run per 64x64 block to align the reference before
choosing partitioning in speed 6. The overall CPU cycle cost due
to this additional 64x64 block match (SSE2 version) takes around 2%
at low bit-rate rtc speed 6. When strong motion activities exist in
the video sequence, it substantially improves the partition
selection accuracy, thereby achieving better compression performance
and lower CPU cycles.
The experiments were tested in RTC speed -6 setting:
cloud 1080p 500 kbps
17006 b/f, 37.086 dB, 5386 ms ->
16669 b/f, 37.970 dB, 5085 ms (>0.9dB gain and 6% faster)
pedestrian_area 1080p 500 kbps
53537 b/f, 36.771 dB, 18706 ms ->
51897 b/f, 36.792 dB, 18585 ms (4% bit-rate savings)
blue_sky 1080p 500 kbps
70214 b/f, 33.600 dB, 13979 ms ->
53885 b/f, 33.645 dB, 10878 ms (30% bit-rate savings, 25% faster)
jimred 400 kbps
13380 b/f, 36.014 dB, 5723 ms ->
13377 b/f, 36.087 dB, 5831 ms (2% bit-rate savings, 2% slower)
Change-Id: Iffdb6ea5b16b77016bfa3dd3904d284168ae649c
2015-02-13 20:23:45 +01:00
2014-10-16 15:36:07 +02:00
if ( vpx_config ( "CONFIG_VP9_HIGHBITDEPTH" ) eq "yes" ) {
add_proto qw/unsigned int vp9_highbd_avg_8x8/ , "const uint8_t *, int p" ;
specialize qw/vp9_highbd_avg_8x8/ ;
2014-11-12 23:51:49 +01:00
add_proto qw/unsigned int vp9_highbd_avg_4x4/ , "const uint8_t *, int p" ;
specialize qw/vp9_highbd_avg_4x4/ ;
2015-05-15 05:08:03 +02:00
add_proto qw/void vp9_highbd_minmax_8x8/ , "const uint8_t *s, int p, const uint8_t *d, int dp, int *min, int *max" ;
2015-04-16 02:48:20 +02:00
specialize qw/vp9_highbd_minmax_8x8/ ;
2014-10-16 15:36:07 +02:00
}
2014-02-24 01:33:14 +01:00
# ENCODEMB INVOKE
add_proto qw/void vp9_subtract_block/ , "int rows, int cols, int16_t *diff_ptr, ptrdiff_t diff_stride, const uint8_t *src_ptr, ptrdiff_t src_stride, const uint8_t *pred_ptr, ptrdiff_t pred_stride" ;
2014-07-30 21:16:04 +02:00
specialize qw/vp9_subtract_block neon/ , "$sse2_x86inc" ;
2014-02-24 01:33:14 +01:00
2014-09-19 01:45:53 +02:00
#
# Denoiser
#
if ( vpx_config ( "CONFIG_VP9_TEMPORAL_DENOISING" ) eq "yes" ) {
add_proto qw/int vp9_denoiser_filter/ , "const uint8_t *sig, int sig_stride, const uint8_t *mc_avg, int mc_avg_stride, uint8_t *avg, int avg_stride, int increase_denoising, BLOCK_SIZE bs, int motion_magnitude" ;
specialize qw/vp9_denoiser_filter sse2/ ;
}
2014-09-03 01:34:09 +02:00
if ( vpx_config ( "CONFIG_VP9_HIGHBITDEPTH" ) eq "yes" ) {
# the transform coefficients are held in 32-bit
# values, so the assembler code for vp9_block_error can no longer be used.
add_proto qw/int64_t vp9_block_error/ , "const tran_low_t *coeff, const tran_low_t *dqcoeff, intptr_t block_size, int64_t *ssz" ;
specialize qw/vp9_block_error/ ;
2014-07-02 01:10:44 +02:00
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_quantize_fp/ , "const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-09-03 01:34:09 +02:00
specialize qw/vp9_quantize_fp/ ;
2014-07-07 21:08:40 +02:00
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_quantize_fp_32x32/ , "const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-09-03 01:34:09 +02:00
specialize qw/vp9_quantize_fp_32x32/ ;
2014-02-24 01:33:14 +01:00
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_quantize_b/ , "const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-09-03 01:34:09 +02:00
specialize qw/vp9_quantize_b/ ;
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_quantize_b_32x32/ , "const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-09-03 01:34:09 +02:00
specialize qw/vp9_quantize_b_32x32/ ;
2014-12-04 11:51:10 +01:00
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_fdct8x8_quant/ , "const int16_t *input, int stride, tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-12-04 11:51:10 +01:00
specialize qw/vp9_fdct8x8_quant/ ;
2014-09-03 01:34:09 +02:00
} else {
add_proto qw/int64_t vp9_block_error/ , "const tran_low_t *coeff, const tran_low_t *dqcoeff, intptr_t block_size, int64_t *ssz" ;
2014-09-16 19:46:18 +02:00
specialize qw/vp9_block_error avx2/ , "$sse2_x86inc" ;
2014-09-03 01:34:09 +02:00
2015-04-01 02:46:41 +02:00
add_proto qw/int64_t vp9_block_error_fp/ , "const int16_t *coeff, const int16_t *dqcoeff, int block_size" ;
specialize qw/vp9_block_error_fp sse2/ ;
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_quantize_fp/ , "const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-11-18 17:58:09 +01:00
specialize qw/vp9_quantize_fp neon sse2/ , "$ssse3_x86_64" ;
2014-09-03 01:34:09 +02:00
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_quantize_fp_32x32/ , "const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-09-03 01:34:09 +02:00
specialize qw/vp9_quantize_fp_32x32/ , "$ssse3_x86_64" ;
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_quantize_b/ , "const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-10-14 00:17:05 +02:00
specialize qw/vp9_quantize_b sse2/ , "$ssse3_x86_64" ;
2014-09-03 01:34:09 +02:00
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_quantize_b_32x32/ , "const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-09-16 19:46:18 +02:00
specialize qw/vp9_quantize_b_32x32/ , "$ssse3_x86_64" ;
2014-12-04 11:51:10 +01:00
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_fdct8x8_quant/ , "const int16_t *input, int stride, tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2015-01-16 04:29:46 +01:00
specialize qw/vp9_fdct8x8_quant sse2 ssse3 neon/ ;
2014-09-03 01:34:09 +02:00
}
2014-02-24 01:33:14 +01:00
#
# Structured Similarity (SSIM)
#
if ( vpx_config ( "CONFIG_INTERNAL_STATS" ) eq "yes" ) {
add_proto qw/void vp9_ssim_parms_8x8/ , "uint8_t *s, int sp, uint8_t *r, int rp, unsigned long *sum_s, unsigned long *sum_r, unsigned long *sum_sq_s, unsigned long *sum_sq_r, unsigned long *sum_sxr" ;
specialize qw/vp9_ssim_parms_8x8/ , "$sse2_x86_64" ;
add_proto qw/void vp9_ssim_parms_16x16/ , "uint8_t *s, int sp, uint8_t *r, int rp, unsigned long *sum_s, unsigned long *sum_r, unsigned long *sum_sq_s, unsigned long *sum_sq_r, unsigned long *sum_sxr" ;
specialize qw/vp9_ssim_parms_16x16/ , "$sse2_x86_64" ;
}
# fdct functions
2014-09-03 01:34:09 +02:00
if ( vpx_config ( "CONFIG_VP9_HIGHBITDEPTH" ) eq "yes" ) {
add_proto qw/void vp9_fht4x4/ , "const int16_t *input, tran_low_t *output, int stride, int tx_type" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fht4x4 sse2/ ;
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fht8x8/ , "const int16_t *input, tran_low_t *output, int stride, int tx_type" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fht8x8 sse2/ ;
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fht16x16/ , "const int16_t *input, tran_low_t *output, int stride, int tx_type" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fht16x16 sse2/ ;
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fwht4x4/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fwht4x4/ , "$mmx_x86inc" ;
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fdct4x4_1/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fdct4x4_1 sse2/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fdct4x4/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fdct4x4 sse2/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fdct8x8_1/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fdct8x8_1 sse2/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fdct8x8/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fdct8x8 sse2/ ;
2014-05-30 03:14:17 +02:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fdct16x16_1/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fdct16x16_1 sse2/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fdct16x16/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fdct16x16 sse2/ ;
2014-05-30 03:14:17 +02:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fdct32x32_1/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fdct32x32_1 sse2/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fdct32x32/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fdct32x32 sse2/ ;
2014-05-30 03:14:17 +02:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fdct32x32_rd/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_fdct32x32_rd sse2/ ;
2014-09-03 01:34:09 +02:00
} else {
add_proto qw/void vp9_fht4x4/ , "const int16_t *input, tran_low_t *output, int stride, int tx_type" ;
specialize qw/vp9_fht4x4 sse2/ ;
add_proto qw/void vp9_fht8x8/ , "const int16_t *input, tran_low_t *output, int stride, int tx_type" ;
specialize qw/vp9_fht8x8 sse2/ ;
add_proto qw/void vp9_fht16x16/ , "const int16_t *input, tran_low_t *output, int stride, int tx_type" ;
specialize qw/vp9_fht16x16 sse2/ ;
add_proto qw/void vp9_fwht4x4/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_fwht4x4/ , "$mmx_x86inc" ;
add_proto qw/void vp9_fdct4x4_1/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_fdct4x4_1 sse2/ ;
add_proto qw/void vp9_fdct4x4/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_fdct4x4 sse2/ ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fdct8x8_1/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_fdct8x8_1 sse2 neon/ ;
2014-05-30 03:14:17 +02:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fdct8x8/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_fdct8x8 sse2 neon/ , "$ssse3_x86_64" ;
2014-02-24 01:33:14 +01:00
2014-09-03 01:34:09 +02:00
add_proto qw/void vp9_fdct16x16_1/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_fdct16x16_1 sse2/ ;
add_proto qw/void vp9_fdct16x16/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_fdct16x16 sse2/ ;
add_proto qw/void vp9_fdct32x32_1/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_fdct32x32_1 sse2/ ;
add_proto qw/void vp9_fdct32x32/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_fdct32x32 sse2 avx2/ ;
add_proto qw/void vp9_fdct32x32_rd/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_fdct32x32_rd sse2 avx2/ ;
}
2014-02-24 01:33:14 +01:00
#
# Motion search
#
2014-04-11 08:28:52 +02:00
add_proto qw/int vp9_full_search_sad/ , "const struct macroblock *x, const struct mv *ref_mv, int sad_per_bit, int distance, const struct vp9_variance_vtable *fn_ptr, const struct mv *center_mv, struct mv *best_mv" ;
2014-02-24 01:33:14 +01:00
specialize qw/vp9_full_search_sad sse3 sse4_1/ ;
$ vp9_full_search_sad_sse3 = vp9_full_search_sadx3 ;
$ vp9_full_search_sad_sse4_1 = vp9_full_search_sadx8 ;
2014-04-26 03:22:27 +02:00
add_proto qw/int vp9_diamond_search_sad/ , "const struct macroblock *x, const struct search_site_config *cfg, struct mv *ref_mv, struct mv *best_mv, int search_param, int sad_per_bit, int *num00, const struct vp9_variance_vtable *fn_ptr, const struct mv *center_mv" ;
2014-07-10 18:19:03 +02:00
specialize qw/vp9_diamond_search_sad/ ;
2014-02-24 01:33:14 +01:00
2014-04-26 03:22:27 +02:00
add_proto qw/int vp9_full_range_search/ , "const struct macroblock *x, const struct search_site_config *cfg, struct mv *ref_mv, struct mv *best_mv, int search_param, int sad_per_bit, int *num00, const struct vp9_variance_vtable *fn_ptr, const struct mv *center_mv" ;
2014-02-24 01:33:14 +01:00
specialize qw/vp9_full_range_search/ ;
2014-05-20 19:48:54 +02:00
add_proto qw/void vp9_temporal_filter_apply/ , "uint8_t *frame1, unsigned int stride, uint8_t *frame2, unsigned int block_width, unsigned int block_height, int strength, int filter_weight, unsigned int *accumulator, uint16_t *count" ;
2014-02-24 01:33:14 +01:00
specialize qw/vp9_temporal_filter_apply sse2/ ;
2014-09-06 00:00:54 +02:00
if ( vpx_config ( "CONFIG_VP9_HIGHBITDEPTH" ) eq "yes" ) {
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance64x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_variance64x64/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance64x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_avg_variance64x64/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance32x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_variance32x64/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance32x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_avg_variance32x64/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance64x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_variance64x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance64x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_avg_variance64x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance32x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_variance32x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance32x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_avg_variance32x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance16x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_variance16x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance16x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_avg_variance16x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance32x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_variance32x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance32x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_avg_variance32x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance16x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_variance16x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance16x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_avg_variance16x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance8x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_variance8x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance8x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_avg_variance8x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance16x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_variance16x8/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance16x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_avg_variance16x8/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance8x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_variance8x8/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance8x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_avg_variance8x8/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance8x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_variance8x4/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance8x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_sub_pixel_avg_variance8x4/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance4x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_highbd_sub_pixel_variance4x8/ ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance4x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_highbd_sub_pixel_avg_variance4x8/ ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_variance4x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_highbd_sub_pixel_variance4x4/ ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_sub_pixel_avg_variance4x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_highbd_sub_pixel_avg_variance4x4/ ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance64x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_variance64x64/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance64x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_avg_variance64x64/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance32x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_variance32x64/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance32x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_avg_variance32x64/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance64x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_variance64x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance64x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_avg_variance64x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance32x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_variance32x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance32x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_avg_variance32x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance16x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_variance16x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance16x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_avg_variance16x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance32x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_variance32x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance32x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_avg_variance32x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance16x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_variance16x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance16x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_avg_variance16x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance8x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_variance8x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance8x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_avg_variance8x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance16x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_variance16x8/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance16x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_avg_variance16x8/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance8x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_variance8x8/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance8x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_avg_variance8x8/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance8x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_variance8x4/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance8x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_10_sub_pixel_avg_variance8x4/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance4x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_highbd_10_sub_pixel_variance4x8/ ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance4x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_highbd_10_sub_pixel_avg_variance4x8/ ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_variance4x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_highbd_10_sub_pixel_variance4x4/ ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_10_sub_pixel_avg_variance4x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_highbd_10_sub_pixel_avg_variance4x4/ ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance64x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_variance64x64/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance64x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_avg_variance64x64/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance32x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_variance32x64/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance32x64/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_avg_variance32x64/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance64x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_variance64x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance64x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_avg_variance64x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance32x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_variance32x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance32x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_avg_variance32x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance16x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_variance16x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance16x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_avg_variance16x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance32x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_variance32x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance32x32/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_avg_variance32x32/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance16x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_variance16x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance16x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_avg_variance16x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance8x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_variance8x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance8x16/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_avg_variance8x16/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance16x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_variance16x8/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance16x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_avg_variance16x8/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance8x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_variance8x8/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance8x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_avg_variance8x8/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance8x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_variance8x4/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance8x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
2014-10-16 15:00:54 +02:00
specialize qw/vp9_highbd_12_sub_pixel_avg_variance8x4/ , "$sse2_x86inc" ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance4x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_highbd_12_sub_pixel_variance4x8/ ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance4x8/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_highbd_12_sub_pixel_avg_variance4x8/ ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_variance4x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse" ;
specialize qw/vp9_highbd_12_sub_pixel_variance4x4/ ;
2014-09-06 00:00:54 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/unsigned int vp9_highbd_12_sub_pixel_avg_variance4x4/ , "const uint8_t *src_ptr, int source_stride, int xoffset, int yoffset, const uint8_t *ref_ptr, int ref_stride, unsigned int *sse, const uint8_t *second_pred" ;
specialize qw/vp9_highbd_12_sub_pixel_avg_variance4x4/ ;
2014-09-06 00:00:54 +02:00
2014-09-03 01:34:09 +02:00
# ENCODEMB INVOKE
2014-10-08 21:43:22 +02:00
add_proto qw/int64_t vp9_highbd_block_error/ , "const tran_low_t *coeff, const tran_low_t *dqcoeff, intptr_t block_size, int64_t *ssz, int bd" ;
2014-10-16 14:38:46 +02:00
specialize qw/vp9_highbd_block_error sse2/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_subtract_block/ , "int rows, int cols, int16_t *diff_ptr, ptrdiff_t diff_stride, const uint8_t *src_ptr, ptrdiff_t src_stride, const uint8_t *pred_ptr, ptrdiff_t pred_stride, int bd" ;
specialize qw/vp9_highbd_subtract_block/ ;
2014-09-03 01:34:09 +02:00
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_highbd_quantize_fp/ , "const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-10-08 21:43:22 +02:00
specialize qw/vp9_highbd_quantize_fp/ ;
2014-09-03 01:34:09 +02:00
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_highbd_quantize_fp_32x32/ , "const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-10-08 21:43:22 +02:00
specialize qw/vp9_highbd_quantize_fp_32x32/ ;
2014-09-03 01:34:09 +02:00
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_highbd_quantize_b/ , "const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-10-16 14:38:46 +02:00
specialize qw/vp9_highbd_quantize_b sse2/ ;
2014-09-03 01:34:09 +02:00
2014-12-22 18:35:29 +01:00
add_proto qw/void vp9_highbd_quantize_b_32x32/ , "const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan" ;
2014-10-16 14:38:46 +02:00
specialize qw/vp9_highbd_quantize_b_32x32 sse2/ ;
2014-09-03 01:34:09 +02:00
#
# Structured Similarity (SSIM)
#
if ( vpx_config ( "CONFIG_INTERNAL_STATS" ) eq "yes" ) {
2014-10-01 06:56:33 +02:00
add_proto qw/void vp9_highbd_ssim_parms_8x8/ , "uint16_t *s, int sp, uint16_t *r, int rp, uint32_t *sum_s, uint32_t *sum_r, uint32_t *sum_sq_s, uint32_t *sum_sq_r, uint32_t *sum_sxr" ;
specialize qw/vp9_highbd_ssim_parms_8x8/ ;
2014-09-03 01:34:09 +02:00
}
# fdct functions
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_fht4x4/ , "const int16_t *input, tran_low_t *output, int stride, int tx_type" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_highbd_fht4x4 sse2/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_fht8x8/ , "const int16_t *input, tran_low_t *output, int stride, int tx_type" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_highbd_fht8x8 sse2/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_fht16x16/ , "const int16_t *input, tran_low_t *output, int stride, int tx_type" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_highbd_fht16x16 sse2/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_fwht4x4/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_highbd_fwht4x4/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_fdct4x4/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_highbd_fdct4x4 sse2/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_fdct8x8_1/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_highbd_fdct8x8_1/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_fdct8x8/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_highbd_fdct8x8 sse2/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_fdct16x16_1/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_highbd_fdct16x16_1/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_fdct16x16/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_highbd_fdct16x16 sse2/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_fdct32x32_1/ , "const int16_t *input, tran_low_t *output, int stride" ;
specialize qw/vp9_highbd_fdct32x32_1/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_fdct32x32/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_highbd_fdct32x32 sse2/ ;
2014-09-03 01:34:09 +02:00
2014-10-08 21:43:22 +02:00
add_proto qw/void vp9_highbd_fdct32x32_rd/ , "const int16_t *input, tran_low_t *output, int stride" ;
2014-10-24 09:48:02 +02:00
specialize qw/vp9_highbd_fdct32x32_rd sse2/ ;
2014-09-03 01:34:09 +02:00
2014-09-18 01:55:05 +02:00
add_proto qw/void vp9_highbd_temporal_filter_apply/ , "uint8_t *frame1, unsigned int stride, uint8_t *frame2, unsigned int block_width, unsigned int block_height, int strength, int filter_weight, unsigned int *accumulator, uint16_t *count" ;
specialize qw/vp9_highbd_temporal_filter_apply/ ;
2014-09-03 01:34:09 +02:00
2014-09-06 00:00:54 +02:00
}
2014-09-03 01:34:09 +02:00
# End vp9_high encoder functions
2014-09-06 00:00:54 +02:00
2014-02-24 01:33:14 +01:00
}
# end encoder functions
1 ;