80465dae88
This SSE2 is based on VP8 denoiser's SSE2 code. In VP8, there are only 16x16 blocks in denoiser, while in VP9, there are 13 different block sizes. By adding this SSE2 code, the improvement of encoder speed is around 20%(using C code vs using SSE2 code), vary for different clips. The unit test for VP9 denoiser is to confirm that the SSE2 code is bit-exact with the C code. The unit test covers all block size. Change-Id: Ic8d8ac26db4ea40a5f146b5678a065af07eaaa3d
139 lines
5.8 KiB
Makefile
139 lines
5.8 KiB
Makefile
##
|
|
## Copyright (c) 2010 The WebM project authors. All Rights Reserved.
|
|
##
|
|
## Use of this source code is governed by a BSD-style license
|
|
## that can be found in the LICENSE file in the root of the source
|
|
## tree. An additional intellectual property rights grant can be found
|
|
## in the file PATENTS. All contributing project authors may
|
|
## be found in the AUTHORS file in the root of the source tree.
|
|
##
|
|
|
|
VP9_CX_EXPORTS += exports_enc
|
|
|
|
VP9_CX_SRCS-yes += $(VP9_COMMON_SRCS-yes)
|
|
VP9_CX_SRCS-no += $(VP9_COMMON_SRCS-no)
|
|
VP9_CX_SRCS_REMOVE-yes += $(VP9_COMMON_SRCS_REMOVE-yes)
|
|
VP9_CX_SRCS_REMOVE-no += $(VP9_COMMON_SRCS_REMOVE-no)
|
|
|
|
VP9_CX_SRCS-yes += vp9_cx_iface.c
|
|
|
|
VP9_CX_SRCS-yes += encoder/vp9_bitstream.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_context_tree.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_context_tree.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_cost.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_cost.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_dct.c
|
|
VP9_CX_SRCS-$(CONFIG_VP9_TEMPORAL_DENOISING) += encoder/vp9_denoiser.c
|
|
VP9_CX_SRCS-$(CONFIG_VP9_TEMPORAL_DENOISING) += encoder/vp9_denoiser.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_encodeframe.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_encodeframe.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_encodemb.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_encodemv.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_extend.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_firstpass.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_block.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_writer.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_writer.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_write_bit_buffer.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_write_bit_buffer.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_bitstream.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_encodemb.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_encodemv.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_extend.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_firstpass.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_lookahead.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_lookahead.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_mcomp.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_encoder.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_quantize.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_ratectrl.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_rd.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_rdopt.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_pickmode.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_svc_layercontext.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_tokenize.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_treewriter.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_variance.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_mcomp.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_encoder.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_picklpf.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_picklpf.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_quantize.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_ratectrl.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_rd.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_rdopt.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_pickmode.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_sad.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_segmentation.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_segmentation.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_speed_features.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_speed_features.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_subexp.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_subexp.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_svc_layercontext.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_resize.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_resize.h
|
|
VP9_CX_SRCS-$(CONFIG_INTERNAL_STATS) += encoder/vp9_ssim.c
|
|
VP9_CX_SRCS-$(CONFIG_INTERNAL_STATS) += encoder/vp9_ssim.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_tokenize.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_treewriter.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_variance.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_aq_variance.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_aq_variance.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_aq_cyclicrefresh.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_aq_cyclicrefresh.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_aq_complexity.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_aq_complexity.h
|
|
ifeq ($(CONFIG_VP9_POSTPROC),yes)
|
|
VP9_CX_SRCS-$(CONFIG_INTERNAL_STATS) += common/vp9_postproc.h
|
|
VP9_CX_SRCS-$(CONFIG_INTERNAL_STATS) += common/vp9_postproc.c
|
|
endif
|
|
VP9_CX_SRCS-yes += encoder/vp9_temporal_filter.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_temporal_filter.h
|
|
VP9_CX_SRCS-yes += encoder/vp9_mbgraph.c
|
|
VP9_CX_SRCS-yes += encoder/vp9_mbgraph.h
|
|
|
|
VP9_CX_SRCS-$(HAVE_AVX2) += encoder/x86/vp9_variance_impl_intrin_avx2.c
|
|
VP9_CX_SRCS-$(HAVE_SSE2) += encoder/x86/vp9_sad4d_sse2.asm
|
|
VP9_CX_SRCS-$(HAVE_AVX2) += encoder/x86/vp9_sad4d_intrin_avx2.c
|
|
VP9_CX_SRCS-$(HAVE_AVX2) += encoder/x86/vp9_subpel_variance_impl_intrin_avx2.c
|
|
VP9_CX_SRCS-$(HAVE_SSE2) += encoder/x86/vp9_temporal_filter_apply_sse2.asm
|
|
VP9_CX_SRCS-$(HAVE_SSE3) += encoder/x86/vp9_sad_sse3.asm
|
|
|
|
ifeq ($(CONFIG_USE_X86INC),yes)
|
|
VP9_CX_SRCS-$(HAVE_MMX) += encoder/x86/vp9_dct_mmx.asm
|
|
VP9_CX_SRCS-$(HAVE_SSE2) += encoder/x86/vp9_error_sse2.asm
|
|
VP9_CX_SRCS-$(HAVE_SSE2) += encoder/x86/vp9_sad_sse2.asm
|
|
VP9_CX_SRCS-$(HAVE_SSE2) += encoder/x86/vp9_subtract_sse2.asm
|
|
VP9_CX_SRCS-$(HAVE_SSE2) += encoder/x86/vp9_variance_sse2.c
|
|
VP9_CX_SRCS-$(HAVE_SSE2) += encoder/x86/vp9_subpel_variance.asm
|
|
endif
|
|
|
|
ifeq ($(ARCH_X86_64),yes)
|
|
VP9_CX_SRCS-$(HAVE_SSSE3) += encoder/x86/vp9_quantize_ssse3_x86_64.asm
|
|
VP9_CX_SRCS-$(HAVE_SSSE3) += encoder/x86/vp9_dct_ssse3_x86_64.asm
|
|
endif
|
|
VP9_CX_SRCS-$(HAVE_SSSE3) += encoder/x86/vp9_sad_ssse3.asm
|
|
VP9_CX_SRCS-$(HAVE_SSE4_1) += encoder/x86/vp9_sad_sse4.asm
|
|
VP9_CX_SRCS-$(ARCH_X86_64) += encoder/x86/vp9_ssim_opt_x86_64.asm
|
|
|
|
VP9_CX_SRCS-$(HAVE_SSE2) += encoder/x86/vp9_dct_sse2.c
|
|
VP9_CX_SRCS-$(HAVE_SSE2) += encoder/x86/vp9_dct32x32_sse2.c
|
|
|
|
ifeq ($(CONFIG_VP9_TEMPORAL_DENOISING),yes)
|
|
VP9_CX_SRCS-$(HAVE_SSE2) += encoder/x86/vp9_denoiser_sse2.c
|
|
endif
|
|
|
|
VP9_CX_SRCS-$(HAVE_AVX2) += encoder/x86/vp9_dct32x32_avx2.c
|
|
VP9_CX_SRCS-$(HAVE_AVX2) += encoder/x86/vp9_dct_avx2.c
|
|
VP9_CX_SRCS-$(HAVE_AVX2) += encoder/x86/vp9_error_intrin_avx2.c
|
|
VP9_CX_SRCS-$(HAVE_AVX2) += encoder/x86/vp9_variance_avx2.c
|
|
|
|
VP9_CX_SRCS-$(HAVE_NEON) += encoder/arm/neon/vp9_sad_neon.c
|
|
VP9_CX_SRCS-$(HAVE_NEON) += encoder/arm/neon/vp9_dct_neon.c
|
|
VP9_CX_SRCS-$(HAVE_NEON) += encoder/arm/neon/vp9_variance_neon.c
|
|
VP9_CX_SRCS-$(HAVE_NEON) += encoder/arm/neon/vp9_quantize_neon.c
|
|
VP9_CX_SRCS-$(HAVE_NEON) += encoder/arm/neon/vp9_subtract_neon.c
|
|
|
|
VP9_CX_SRCS-yes := $(filter-out $(VP9_CX_SRCS_REMOVE-yes),$(VP9_CX_SRCS-yes))
|