2010-05-18 17:58:33 +02:00
|
|
|
/*
|
2010-09-09 14:16:39 +02:00
|
|
|
* Copyright (c) 2010 The WebM project authors. All Rights Reserved.
|
2010-05-18 17:58:33 +02:00
|
|
|
*
|
2010-06-18 18:39:21 +02:00
|
|
|
* Use of this source code is governed by a BSD-style license
|
2010-06-04 22:19:40 +02:00
|
|
|
* that can be found in the LICENSE file in the root of the source
|
|
|
|
* tree. An additional intellectual property rights grant can be found
|
2010-06-18 18:39:21 +02:00
|
|
|
* in the file PATENTS. All contributing project authors may
|
2010-06-04 22:19:40 +02:00
|
|
|
* be found in the AUTHORS file in the root of the source tree.
|
2010-05-18 17:58:33 +02:00
|
|
|
*/
|
|
|
|
|
2012-11-30 01:36:10 +01:00
|
|
|
#ifndef VP9_ENCODER_VP9_ONYX_INT_H_
|
|
|
|
#define VP9_ENCODER_VP9_ONYX_INT_H_
|
2010-05-18 17:58:33 +02:00
|
|
|
|
|
|
|
#include <stdio.h>
|
2014-01-28 21:57:49 +01:00
|
|
|
|
2012-12-23 16:20:10 +01:00
|
|
|
#include "./vpx_config.h"
|
2014-01-28 21:57:49 +01:00
|
|
|
#include "vpx_ports/mem.h"
|
|
|
|
#include "vpx/internal/vpx_codec_internal.h"
|
|
|
|
|
|
|
|
#include "vp9/common/vp9_entropy.h"
|
|
|
|
#include "vp9/common/vp9_entropymode.h"
|
2012-11-27 22:59:17 +01:00
|
|
|
#include "vp9/common/vp9_onyx.h"
|
|
|
|
#include "vp9/common/vp9_onyxc_int.h"
|
2014-01-28 21:57:49 +01:00
|
|
|
|
2012-11-28 19:41:40 +01:00
|
|
|
#include "vp9/encoder/vp9_encodemb.h"
|
2014-02-06 03:28:28 +01:00
|
|
|
#include "vp9/encoder/vp9_firstpass.h"
|
2012-11-28 19:41:40 +01:00
|
|
|
#include "vp9/encoder/vp9_lookahead.h"
|
2014-02-03 21:35:06 +01:00
|
|
|
#include "vp9/encoder/vp9_mbgraph.h"
|
2014-01-28 21:57:49 +01:00
|
|
|
#include "vp9/encoder/vp9_mcomp.h"
|
|
|
|
#include "vp9/encoder/vp9_quantize.h"
|
|
|
|
#include "vp9/encoder/vp9_ratectrl.h"
|
|
|
|
#include "vp9/encoder/vp9_tokenize.h"
|
|
|
|
#include "vp9/encoder/vp9_treewriter.h"
|
|
|
|
#include "vp9/encoder/vp9_variance.h"
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2014-01-18 21:16:11 +01:00
|
|
|
#ifdef __cplusplus
|
|
|
|
extern "C" {
|
|
|
|
#endif
|
|
|
|
|
2013-10-07 11:54:19 +02:00
|
|
|
// #define MODE_TEST_HIT_STATS
|
2013-08-21 13:34:14 +02:00
|
|
|
|
2013-04-03 00:08:50 +02:00
|
|
|
// Golden-frame interval and boost defaults.
#if CONFIG_MULTIPLE_ARF
// Set MIN_GF_INTERVAL to 1 for the full decomposition.
#define MIN_GF_INTERVAL 2
#else
#define MIN_GF_INTERVAL 4
#endif
#define DEFAULT_GF_INTERVAL 10
#define DEFAULT_KF_BOOST 2000
#define DEFAULT_GF_BOOST 2000

#define KEY_FRAME_CONTEXT 5

// Array bounds for the per-mode and per-reference threshold tables.
// MAX_MODES must equal the number of enumerators in THR_MODES and
// MAX_REFS the number of enumerators in THR_MODES_SUB8X8.
#define MAX_MODES 30
#define MAX_REFS 6
|
Dual 16x16 inter prediction.
This patch introduces the concept of dual inter16x16 prediction. A
16x16 inter-predicted macroblock can use 2 references instead of 1,
where both references use the same mvmode (new, near/est, zero). In the
case of newmv, this means that two MVs are coded instead of one. The
frame can be encoded in 3 ways: all MBs single-prediction, all MBs dual
prediction, or per-MB single/dual prediction selection ("hybrid"), in
which case a single bit is coded per-MB to indicate whether the MB uses
single or dual inter prediction.
In the future, we can (maybe?) get further gains by mixing this with
Adrian's 32x32 work, per-segment dual prediction settings, or adding
support for dual splitmv/8x8mv inter prediction.
Gain (on derf-set, CQ mode) is ~2.8% (SSIM) or ~3.6% (glb PSNR). Most
gain is at medium/high bitrates, but there's minor gains at low bitrates
also. Output was confirmed to match between encoder and decoder.
Note for optimization people: this patch introduces a 2nd version of
16x16/8x8 sixtap/bilin functions, which does an avg instead of a
store. They may want to look and make sure this is implemented to
their satisfaction so we can optimize it best in the future.
Change-ID: I59dc84b07cbb3ccf073ac0f756d03d294cb19281
2011-12-06 20:53:02 +01:00
|
|
|
|
2010-05-18 17:58:33 +02:00
|
|
|
// Lower and upper limits for threshold multipliers.
// NOTE(review): presumably these bound the rd_thresh_freq_fact adaptation;
// confirm against the rd code.
#define MIN_THRESHMULT 32
#define MAX_THRESHMULT 512

// Per-mode zbin boost values. All are currently zero.
#define GF_ZEROMV_ZBIN_BOOST 0
#define LF_ZEROMV_ZBIN_BOOST 0
#define MV_ZBIN_BOOST 0
#define SPLIT_MV_ZBIN_BOOST 0
#define INTRA_ZBIN_BOOST 0
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
typedef struct {
|
2012-07-26 22:42:07 +02:00
|
|
|
int nmvjointcost[MV_JOINTS];
|
|
|
|
int nmvcosts[2][MV_VALS];
|
|
|
|
int nmvcosts_hp[2][MV_VALS];
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-10-31 22:40:53 +01:00
|
|
|
vp9_prob segment_pred_probs[PREDICTION_PROBS];
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
unsigned char *last_frame_seg_map_copy;
|
2012-04-11 16:44:14 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
// 0 = Intra, Last, GF, ARF
|
|
|
|
signed char last_ref_lf_deltas[MAX_REF_LF_DELTAS];
|
2013-06-07 07:55:31 +02:00
|
|
|
// 0 = ZERO_MV, MV
|
2012-07-14 00:21:29 +02:00
|
|
|
signed char last_mode_lf_deltas[MAX_MODE_LF_DELTAS];
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-09-28 01:41:20 +02:00
|
|
|
FRAME_CONTEXT fc;
|
2010-05-18 17:58:33 +02:00
|
|
|
} CODING_CONTEXT;
|
|
|
|
|
2013-07-18 17:41:44 +02:00
|
|
|
// This enumerator type needs to be kept aligned with the mode order in
// const MODE_DEFINITION vp9_mode_order[MAX_MODES] used in the rd code.
// The enumerators are used as indices, so their order and count (MAX_MODES)
// must not change independently of that table.
typedef enum {
  THR_NEARESTMV,
  THR_NEARESTA,
  THR_NEARESTG,

  THR_DC,

  THR_NEWMV,
  THR_NEWA,
  THR_NEWG,

  THR_NEARMV,
  THR_NEARA,
  THR_COMP_NEARESTLA,
  THR_COMP_NEARESTGA,

  THR_TM,

  THR_COMP_NEARLA,
  THR_COMP_NEWLA,
  THR_NEARG,
  THR_COMP_NEARGA,
  THR_COMP_NEWGA,

  THR_ZEROMV,
  THR_ZEROG,
  THR_ZEROA,
  THR_COMP_ZEROLA,
  THR_COMP_ZEROGA,

  THR_H_PRED,
  THR_V_PRED,
  THR_D135_PRED,
  THR_D207_PRED,
  THR_D153_PRED,
  THR_D63_PRED,
  THR_D117_PRED,
  THR_D45_PRED
} THR_MODES;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-09-28 01:02:49 +02:00
|
|
|
// Reference-frame categories for sub-8x8 threshold tables. The number of
// enumerators must equal MAX_REFS.
typedef enum {
  THR_LAST,
  THR_GOLD,
  THR_ALTR,
  THR_COMP_LA,
  THR_COMP_GA,
  THR_INTRA
} THR_MODES_SUB8X8;
|
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
// Motion search pattern selected through SPEED_FEATURES.search_method.
typedef enum {
  DIAMOND = 0,
  NSTEP = 1,
  HEX = 2,
  BIGDIA = 3,
  SQUARE = 4,
  FAST_HEX = 5
} SEARCH_METHODS;
|
|
|
|
|
Tx size selection enhancements
(1) Refines the modeling function and uses that to add some speed
features. Specifically, instead of using a flag use_largest_txfm as
a speed feature, an enum tx_size_search_method is used, of which
two of the types are USE_FULL_RD and USE_LARGESTALL. Two other
new types are added:
USE_LARGESTINTRA (use largest only for intra)
USE_LARGESTINTRA_MODELINTER (use largest for intra, and model for
inter)
(2) Another change is that the framework for deciding transform type
is simplified to use a heuristic count based method rather than
an rd based method using txfm_cache. In practice the new method
is found to work just as well - with derf only -0.01 down.
The new method is more compatible with the new framework where
certain rd costs are based on full rd and certain others are
based on modeled rd or are not computed. In this patch the existing
rd based method is still kept for use in the USE_FULL_RD mode.
In the other modes, the count based method is used.
However the recommendation is to remove it eventually since the
benefit is limited, and will remove a lot of complications in
the code
(3) Finally a bug is fixed with the existing use_largest_txfm speed feature
that causes mismatches when the lossless mode and 4x4 WH transform is
forced.
Results on derf:
USE_FULL_RD: +0.03% (due to change in the tables), 0% encode time reduction
USE_LARGESTINTRA: -0.21%, 15% encode time reduction (this one is a
pretty good compromise)
USE_LARGESTINTRA_MODELINTER: -0.98%, 22% encode time reduction
(currently the benefit of modeling is limited for txfm size selection,
but keeping this enum as a placeholder) .
USE_LARGESTALL: -1.05%, 27% encode-time reduction (same as existing
use_largest_txfm speed feature).
Change-Id: I4d60a5f9ce78fbc90cddf2f97ed91d8bc0d4f936
2013-06-22 01:31:12 +02:00
|
|
|
// How the transform size is chosen (SPEED_FEATURES.tx_size_search_method).
typedef enum {
  // Full rd based selection.
  USE_FULL_RD = 0,
  // Use the largest transform only for intra.
  USE_LARGESTINTRA,
  // Use the largest transform for intra, and a model for inter.
  USE_LARGESTINTRA_MODELINTER,
  // Always use the largest transform.
  USE_LARGESTALL
} TX_SIZE_SEARCH_METHOD;
|
|
|
|
|
2014-01-29 19:03:07 +01:00
|
|
|
// Mode for SPEED_FEATURES.auto_min_max_partition_size, which derives the
// min/max partition sizes of a 64x64 region from neighboring regions.
// NOTE(review): the exact difference between RELAXED and STRICT is defined
// by the partition search code, not visible here.
typedef enum {
  NOT_IN_USE = 0,
  RELAXED_NEIGHBORING_MIN_MAX = 1,
  STRICT_NEIGHBORING_MIN_MAX = 2
} AUTO_MIN_MAX_MODE;
|
|
|
|
|
2013-07-03 23:47:54 +02:00
|
|
|
// Bit flags combined into SPEED_FEATURES.mode_search_skip_flags.
typedef enum {
  // Values should be powers of 2 so that they can be selected as bits of
  // an integer flags field

  // terminate search early based on distortion so far compared to
  // qp step, distortion in the neighborhood of the frame, etc.
  FLAG_EARLY_TERMINATE = 1 << 0,

  // skips comp inter modes if the best so far is an intra mode
  FLAG_SKIP_COMP_BESTINTRA = 1 << 1,

  // skips comp inter modes if the best single intermode so far does
  // not have the same reference as one of the two references being
  // tested
  FLAG_SKIP_COMP_REFMISMATCH = 1 << 2,

  // skips oblique intra modes if the best so far is an inter mode
  FLAG_SKIP_INTRA_BESTINTER = 1 << 3,

  // skips oblique intra modes at angles 27, 63, 117, 153 if the best
  // intra so far is not one of the neighboring directions
  FLAG_SKIP_INTRA_DIRMISMATCH = 1 << 4,

  // skips intra modes other than DC_PRED if the source variance
  // is small
  FLAG_SKIP_INTRA_LOWVAR = 1 << 5
} MODE_SEARCH_SKIP_LOGIC;
|
|
|
|
|
2013-08-07 00:53:35 +02:00
|
|
|
// Sub-pixel motion search method (SPEED_FEATURES.subpel_search_method).
typedef enum {
  SUBPEL_TREE = 0
  // Other methods to come
} SUBPEL_SEARCH_METHODS;
|
|
|
|
|
2013-08-22 18:23:02 +02:00
|
|
|
// Bit masks over intra prediction modes (bit n <=> mode with enum value n),
// used for SPEED_FEATURES.intra_y_mode_mask / intra_uv_mode_mask.
// ALL_INTRA_MODES sets the low ten bits.
#define ALL_INTRA_MODES 0x3FF
// NOTE(review): the literal 0x01 assumes DC_PRED == 0 -- confirm.
#define INTRA_DC_ONLY 0x01
#define INTRA_DC_TM ((1 << TM_PRED) | (1 << DC_PRED))
#define INTRA_DC_H_V ((1 << DC_PRED) | (1 << V_PRED) | (1 << H_PRED))
#define INTRA_DC_TM_H_V (INTRA_DC_TM | (1 << V_PRED) | (1 << H_PRED))
|
|
|
|
|
2013-10-01 17:57:18 +02:00
|
|
|
// Controls reuse of the previous frame's partitioning
// (SPEED_FEATURES.use_lastframe_partitioning).
typedef enum {
  // Do not reuse the last frame's partitioning.
  LAST_FRAME_PARTITION_OFF = 0,
  // Reuse it as a starting point only in low motion scenes.
  LAST_FRAME_PARTITION_LOW_MOTION = 1,
  // Always reuse it.
  LAST_FRAME_PARTITION_ALL = 2
} LAST_FRAME_PARTITION_METHOD;
|
|
|
|
|
2014-02-06 01:19:11 +01:00
|
|
|
// Recode loop policy (SPEED_FEATURES.recode_loop).
typedef enum {
  // No recode.
  DISALLOW_RECODE = 0,
  // Allow recode for KF and exceeding maximum frame bandwidth.
  ALLOW_RECODE_KFMAXBW = 1,
  // Allow recode only for KF/ARF/GF frames.
  ALLOW_RECODE_KFARFGF = 2,
  // Allow recode for all frames based on bitrate constraints.
  ALLOW_RECODE = 3
} RECODE_LOOP_TYPE;
|
|
|
|
|
2014-02-04 20:09:34 +01:00
|
|
|
// State of the encode_breakout feature.
typedef enum {
  // encode_breakout is disabled.
  ENCODE_BREAKOUT_DISABLED = 0,
  // encode_breakout is enabled.
  ENCODE_BREAKOUT_ENABLED = 1,
  // encode_breakout is enabled with small max_thresh limit.
  ENCODE_BREAKOUT_LIMITED = 2
} ENCODE_BREAKOUT_TYPE;
|
|
|
|
|
2014-02-25 00:21:13 +01:00
|
|
|
// Partition selection strategy (SPEED_FEATURES.partition_search_type).
typedef enum {
  // Search partitions using RD/NONRD criterion
  SEARCH_PARTITION = 0,

  // Always use a fixed size partition
  FIXED_PARTITION = 1,

  // Use a fixed size partition in every 64X64 SB, where the size is
  // determined based on source variance
  VAR_BASED_FIXED_PARTITION = 2,

  // Use an arbitrary partitioning scheme based on source variance within
  // a 64X64 SB
  VAR_BASED_PARTITION = 3
} PARTITION_SEARCH_TYPE;
|
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
typedef struct {
|
2014-02-10 21:03:02 +01:00
|
|
|
// Frame level coding parameter update
|
|
|
|
int frame_parameter_update;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// Motion search method (Diamond, NSTEP, Hex, Big Diamond, Square, etc).
|
2012-07-14 00:21:29 +02:00
|
|
|
SEARCH_METHODS search_method;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
2014-02-06 01:19:11 +01:00
|
|
|
RECODE_LOOP_TYPE recode_loop;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// Subpel_search_method can only be subpel_tree which does a subpixel
|
|
|
|
// logarithmic search that keeps stepping at 1/2 pixel units until
|
|
|
|
// you stop getting a gain, and then goes on to 1/4 and repeats
|
|
|
|
// the same process. Along the way it skips many diagonals.
|
2013-08-07 00:53:35 +02:00
|
|
|
SUBPEL_SEARCH_METHODS subpel_search_method;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// Maximum number of steps in logarithmic subpel search before giving up.
|
2013-08-07 00:53:35 +02:00
|
|
|
int subpel_iters_per_step;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
2014-01-22 23:57:03 +01:00
|
|
|
// Control when to stop subpel search
|
|
|
|
int subpel_force_stop;
|
|
|
|
|
2014-01-10 20:28:23 +01:00
|
|
|
// Thresh_mult is used to set a threshold for the rd score. A higher value
|
|
|
|
// means that we will accept the best mode so far more often. This number
|
|
|
|
// is used in combination with the current block size, and thresh_freq_fact
|
|
|
|
// to pick a threshold.
|
2012-07-14 00:21:29 +02:00
|
|
|
int thresh_mult[MAX_MODES];
|
2013-09-28 01:02:49 +02:00
|
|
|
int thresh_mult_sub8x8[MAX_REFS];
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// This parameter controls the number of steps we'll do in a diamond
|
|
|
|
// search.
|
2012-07-14 00:21:29 +02:00
|
|
|
int max_step_search_steps;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// This parameter controls which step in the n-step process we start at.
|
|
|
|
// It's changed adaptively based on circumstances.
|
2013-06-24 16:19:16 +02:00
|
|
|
int reduce_first_step_size;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// If this is set to 1, we limit the motion search range to 2 times the
|
|
|
|
// largest motion vector found in the last frame.
|
2013-06-26 18:06:25 +02:00
|
|
|
int auto_mv_step_size;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// Trellis (dynamic programming) optimization of quantized values (+1, 0).
|
2012-07-14 00:21:29 +02:00
|
|
|
int optimize_coefficients;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// Always set to 0. If on it enables 0 cost background transmission
|
|
|
|
// (except for the initial transmission of the segmentation). The feature is
|
|
|
|
// disabled because the addition of very large block sizes make the
|
|
|
|
// backgrounds very to cheap to encode, and the segmentation we have
|
|
|
|
// adds overhead.
|
2013-02-05 11:13:25 +01:00
|
|
|
int static_segmentation;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// If 1 we iterate finding a best reference for 2 ref frames together - via
|
|
|
|
// a log search that iterates 4 times (check around mv for last for best
|
|
|
|
// error of combined predictor then check around mv for alt). If 0 we
|
|
|
|
// we just use the best motion vector found for each frame by itself.
|
2013-06-04 16:58:53 +02:00
|
|
|
int comp_inter_joint_search_thresh;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// This variable is used to cap the maximum number of times we skip testing a
|
|
|
|
// mode to be evaluated. A high value means we will be faster.
|
2013-07-02 13:34:41 +02:00
|
|
|
int adaptive_rd_thresh;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// Enables skipping the reconstruction step (idct, recon) in the
|
|
|
|
// intermediate steps assuming the last frame didn't have too many intra
|
|
|
|
// blocks and the q is less than a threshold.
|
2013-06-26 04:41:56 +02:00
|
|
|
int skip_encode_sb;
|
2013-07-09 01:48:47 +02:00
|
|
|
int skip_encode_frame;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// This variable allows us to reuse the last frames partition choices
|
|
|
|
// (64x64 v 32x32 etc) for this frame. It can be set to only use the last
|
|
|
|
// frame as a starting point in low motion scenes or always use it. If set
|
|
|
|
// we use last partitioning_redo frequency to determine how often to redo
|
|
|
|
// the partitioning from scratch. Adjust_partitioning_from_last_frame
|
|
|
|
// enables us to adjust up or down one partitioning from the last frames
|
|
|
|
// partitioning.
|
2013-10-01 17:57:18 +02:00
|
|
|
LAST_FRAME_PARTITION_METHOD use_lastframe_partitioning;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// Determine which method we use to determine transform size. We can choose
|
|
|
|
// between options like full rd, largest for prediction size, largest
|
|
|
|
// for intra and model coefs for the rest.
|
Tx size selection enhancements
(1) Refines the modeling function and uses that to add some speed
features. Specifically, intead of using a flag use_largest_txfm as
a speed feature, an enum tx_size_search_method is used, of which
two of the types are USE_FULL_RD and USE_LARGESTALL. Two other
new types are added:
USE_LARGESTINTRA (use largest only for intra)
USE_LARGESTINTRA_MODELINTER (use largest for intra, and model for
inter)
(2) Another change is that the framework for deciding transform type
is simplified to use a heuristic count based method rather than
an rd based method using txfm_cache. In practice the new method
is found to work just as well - with derf only -0.01 down.
The new method is more compatible with the new framework where
certain rd costs are based on full rd and certain others are
based on modeled rd or are not computed. In this patch the existing
rd based method is still kept for use in the USE_FULL_RD mode.
In the other modes, the count based method is used.
However the recommendation is to remove it eventually since the
benefit is limited, and will remove a lot of complications in
the code
(3) Finally a bug is fixed with the existing use_largest_txfm speed feature
that causes mismatches when the lossless mode and 4x4 WH transform is
forced.
Results on derf:
USE_FULL_RD: +0.03% (due to change in the tables), 0% encode time reduction
USE_LARGESTINTRA: -0.21%, 15% encode time reduction (this one is a
pretty good compromise)
USE_LARGESTINTRA_MODELINTER: -0.98%, 22% encode time reduction
(currently the benefit of modeling is limited for txfm size selection,
but keeping this enum as a placeholder) .
USE_LARGESTALL: -1.05%, 27% encode-time reduction (same as existing
use_largest_txfm speed feature).
Change-Id: I4d60a5f9ce78fbc90cddf2f97ed91d8bc0d4f936
2013-06-22 01:31:12 +02:00
|
|
|
TX_SIZE_SEARCH_METHOD tx_size_search_method;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// Low precision 32x32 fdct keeps everything in 16 bits and thus is less
|
|
|
|
// precise but significantly faster than the non lp version.
|
2013-08-08 00:22:51 +02:00
|
|
|
int use_lp32x32fdct;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// TODO(JBB): remove this as its no longer used.
|
|
|
|
|
|
|
|
// After looking at the first set of modes (set by index here), skip
|
|
|
|
// checking modes for reference frames that don't match the reference frame
|
|
|
|
// of the best so far.
|
2013-09-05 02:15:05 +02:00
|
|
|
int mode_skip_start;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// TODO(JBB): Remove this.
|
2013-07-01 17:27:12 +02:00
|
|
|
int reference_masking;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
2014-02-25 00:21:13 +01:00
|
|
|
PARTITION_SEARCH_TYPE partition_search_type;
|
|
|
|
|
|
|
|
// Used if partition_search_type = FIXED_SIZE_PARTITION
|
2013-08-27 20:05:08 +02:00
|
|
|
BLOCK_SIZE always_this_block_size;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
2014-02-25 00:21:13 +01:00
|
|
|
// Skip rectangular partition test when partition type none gives better
|
|
|
|
// rd than partition type split.
|
|
|
|
int less_rectangular_check;
|
|
|
|
|
|
|
|
// Disable testing non square partitions. (eg 16x32)
|
|
|
|
int use_square_partition_only;
|
|
|
|
|
2014-01-10 20:28:23 +01:00
|
|
|
// Sets min and max partition sizes for this 64x64 region based on the
|
2014-01-29 19:03:07 +01:00
|
|
|
// same 64x64 in last encoded frame, and the left and above neighbor.
|
|
|
|
AUTO_MIN_MAX_MODE auto_min_max_partition_size;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// Min and max partition size we enable (block_size) as per auto
|
|
|
|
// min max, but also used by adjust partitioning, and pick_partitioning.
|
2013-08-27 20:05:08 +02:00
|
|
|
BLOCK_SIZE min_partition_size;
|
|
|
|
BLOCK_SIZE max_partition_size;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// Whether or not we allow partitions one smaller or one greater than the last
|
|
|
|
// frame's partitioning. Only used if use_lastframe_partitioning is set.
|
2013-07-02 03:18:50 +02:00
|
|
|
int adjust_partitioning_from_last_frame;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// How frequently we re do the partitioning from scratch. Only used if
|
|
|
|
// use_lastframe_partitioning is set.
|
2013-07-02 03:18:50 +02:00
|
|
|
int last_partitioning_redo_frequency;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// Disables sub 8x8 blocksizes in different scenarios: Choices are to disable
|
|
|
|
// it always, to allow it for only Last frame and Intra, disable it for all
|
|
|
|
// inter modes or to enable it always.
|
2013-10-04 15:10:25 +02:00
|
|
|
int disable_split_mask;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
2013-09-12 19:06:47 +02:00
|
|
|
// TODO(jingning): combine the related motion search speed features
|
2014-01-10 20:28:23 +01:00
|
|
|
// This allows us to use motion search at other sizes as a starting
|
|
|
|
// point for this motion search and limits the search range around it.
|
2013-09-12 19:06:47 +02:00
|
|
|
int adaptive_motion_search;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// Allows sub 8x8 modes to use the prediction filter that was determined
|
|
|
|
// best for 8x8 mode. If set to 0 we always re check all the filters for
|
|
|
|
// sizes less than 8x8, 1 means we check all filter modes if no 8x8 filter
|
|
|
|
// was selected, and 2 means we use 8 tap if no 8x8 filter mode was selected.
|
2014-01-24 21:26:57 +01:00
|
|
|
int adaptive_pred_interp_filter;
|
2013-07-03 23:47:54 +02:00
|
|
|
|
|
|
|
// Implements various heuristics to skip searching modes
|
|
|
|
// The heuristics selected are based on flags
|
|
|
|
// defined in the MODE_SEARCH_SKIP_HEURISTICS enum
|
|
|
|
unsigned int mode_search_skip_flags;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
Speed feature to skip split partition based on var
Adds a speed feature to disable split partition search based on a
given threshold on the source variance. A tighter threshold derived
from the threshold provided is used to also disable horizontal and
vertical partitions.
Results on derfraw300:
threshold = 16, psnr = -0.057%, speedup ~1% (football)
threshold = 32, psnr = -0.150%, speedup ~4-5% (football)
threshold = 64, psnr = -0.570%, speedup ~10-12% (football)
Results on stdhdraw250:
threshold = 32, psnr = -0.18%, speedup is somewhat more than derf
because of a larger number of smoother blocks at higher resolution.
Based on these results, a threshold of 32 is chosen for speed 1,
and a threshold of 64 is chosen for speeds 2 and above.
Change-Id: If08912fb6c67fd4242d12a0d094783a99f52f6c6
2013-08-03 02:15:38 +02:00
|
|
|
// A source variance threshold below which the split mode is disabled
|
|
|
|
unsigned int disable_split_var_thresh;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
Cleanup/enhancements of switchable filter search
Cleans up the switchable filter search logic. Also adds a
speed feature - a variance threshold - to disable filter search
if source variance is lower than this value.
Results: derfraw300
threshold = 16, psnr -0.238%, 4-5% speedup (tested on football)
threshold = 32, psnr -0.381%, 8-9% speedup (tested on football)
threshold = 64, psnr -0.611%, 12-13% speedup (tested on football)
threshold = 96, psnr -0.804%, 16-17% speedup (tested on football)
Based on these results, the threshold is chosen as 16 for speed 1,
32 for speed 2, 64 for speed 3 and 96 for speed 4.
Change-Id: Ib630d39192773b1983d3d349b97973768e170c04
2013-08-16 22:51:00 +02:00
|
|
|
// A source variance threshold below which filter search is disabled
|
|
|
|
// Choose a very large value (UINT_MAX) to use 8-tap always
|
|
|
|
unsigned int disable_filter_search_var_thresh;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// These bit masks allow you to enable or disable intra modes for each
|
|
|
|
// transform size separately.
|
2013-10-11 02:29:46 +02:00
|
|
|
int intra_y_mode_mask[TX_SIZES];
|
|
|
|
int intra_uv_mode_mask[TX_SIZES];
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// This variable enables an early break out of mode testing if the model for
|
|
|
|
// rd built from the prediction signal indicates a value that's much
|
|
|
|
// higher than the best rd we've seen so far.
|
2013-07-09 01:01:01 +02:00
|
|
|
int use_rd_breakout;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// This enables us to use an estimate for intra rd based on dc mode rather
|
|
|
|
// than choosing an actual uv mode in the stage of encoding before the actual
|
|
|
|
// final encode.
|
2013-07-16 19:12:34 +02:00
|
|
|
int use_uv_intra_rd_estimate;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
2014-01-23 22:24:20 +01:00
|
|
|
// This feature controls how the loop filter level is determined:
|
|
|
|
// 0: Try the full image with different values.
|
|
|
|
// 1: Try a small portion of the image with different values.
|
|
|
|
// 2: Estimate the level based on quantizer and frame type
|
2013-08-07 00:46:26 +02:00
|
|
|
int use_fast_lpf_pick;
|
2014-01-10 20:28:23 +01:00
|
|
|
|
|
|
|
// This feature limits the number of coefficients updates we actually do
|
|
|
|
// by only looking at counts from 1/2 the bands.
|
2013-08-28 00:07:50 +02:00
|
|
|
int use_fast_coef_updates; // 0: 2-loop, 1: 1-loop, 2: 1-loop reduced
|
2014-01-31 03:33:26 +01:00
|
|
|
|
2014-02-10 21:03:02 +01:00
|
|
|
// This flag controls the use of non-RD mode decision.
|
2014-02-25 00:21:13 +01:00
|
|
|
int use_nonrd_pick_mode;
|
2014-02-04 20:09:34 +01:00
|
|
|
|
|
|
|
// This variable sets the encode_breakout threshold. Currently, it is only
|
|
|
|
// enabled in real time mode.
|
|
|
|
int encode_breakout_thresh;
|
2010-05-18 17:58:33 +02:00
|
|
|
} SPEED_FEATURES;
|
|
|
|
|
2014-02-06 18:23:17 +01:00
|
|
|
typedef struct {
|
|
|
|
RATE_CONTROL rc;
|
|
|
|
int target_bandwidth;
|
|
|
|
int64_t starting_buffer_level;
|
|
|
|
int64_t optimal_buffer_level;
|
|
|
|
int64_t maximum_buffer_size;
|
|
|
|
double framerate;
|
2014-02-07 23:25:27 +01:00
|
|
|
int avg_frame_size;
|
2014-02-06 18:23:17 +01:00
|
|
|
} LAYER_CONTEXT;
|
|
|
|
|
2012-10-31 01:53:32 +01:00
|
|
|
typedef struct VP9_COMP {
|
2013-07-01 20:36:07 +02:00
|
|
|
DECLARE_ALIGNED(16, int16_t, y_quant[QINDEX_RANGE][8]);
|
|
|
|
DECLARE_ALIGNED(16, int16_t, y_quant_shift[QINDEX_RANGE][8]);
|
|
|
|
DECLARE_ALIGNED(16, int16_t, y_zbin[QINDEX_RANGE][8]);
|
|
|
|
DECLARE_ALIGNED(16, int16_t, y_round[QINDEX_RANGE][8]);
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-07-01 20:36:07 +02:00
|
|
|
DECLARE_ALIGNED(16, int16_t, uv_quant[QINDEX_RANGE][8]);
|
|
|
|
DECLARE_ALIGNED(16, int16_t, uv_quant_shift[QINDEX_RANGE][8]);
|
|
|
|
DECLARE_ALIGNED(16, int16_t, uv_zbin[QINDEX_RANGE][8]);
|
|
|
|
DECLARE_ALIGNED(16, int16_t, uv_round[QINDEX_RANGE][8]);
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-05-16 02:55:08 +02:00
|
|
|
#if CONFIG_ALPHA
|
2013-07-01 20:36:07 +02:00
|
|
|
DECLARE_ALIGNED(16, int16_t, a_quant[QINDEX_RANGE][8]);
|
|
|
|
DECLARE_ALIGNED(16, int16_t, a_quant_shift[QINDEX_RANGE][8]);
|
|
|
|
DECLARE_ALIGNED(16, int16_t, a_zbin[QINDEX_RANGE][8]);
|
|
|
|
DECLARE_ALIGNED(16, int16_t, a_round[QINDEX_RANGE][8]);
|
2013-05-16 02:55:08 +02:00
|
|
|
#endif
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
MACROBLOCK mb;
|
2012-10-31 01:53:32 +01:00
|
|
|
VP9_COMMON common;
|
2012-10-31 22:40:53 +01:00
|
|
|
VP9_CONFIG oxcf;
|
2012-07-14 00:21:29 +02:00
|
|
|
struct lookahead_ctx *lookahead;
|
|
|
|
struct lookahead_entry *source;
|
2013-04-03 00:08:50 +02:00
|
|
|
#if CONFIG_MULTIPLE_ARF
|
2013-12-06 01:23:09 +01:00
|
|
|
struct lookahead_entry *alt_ref_source[REF_FRAMES];
|
2013-04-03 00:08:50 +02:00
|
|
|
#else
|
2012-07-14 00:21:29 +02:00
|
|
|
struct lookahead_entry *alt_ref_source;
|
2013-04-03 00:08:50 +02:00
|
|
|
#endif
|
2011-04-13 20:00:18 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
YV12_BUFFER_CONFIG *Source;
|
|
|
|
YV12_BUFFER_CONFIG *un_scaled_source;
|
|
|
|
YV12_BUFFER_CONFIG scaled_source;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2014-02-13 23:08:38 +01:00
|
|
|
int key_frame_frequency;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-10-02 00:14:39 +02:00
|
|
|
int gold_is_last; // gold same as last frame ( short circuit gold searches)
|
|
|
|
int alt_is_last; // Alt same as last ( short circuit altref search)
|
2012-07-14 00:21:29 +02:00
|
|
|
int gold_is_alt; // don't do both alt and gold search ( just do gold).
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-02-20 21:34:31 +01:00
|
|
|
int scaled_ref_idx[3];
|
2013-01-15 22:49:44 +01:00
|
|
|
int lst_fb_idx;
|
|
|
|
int gld_fb_idx;
|
|
|
|
int alt_fb_idx;
|
2013-09-05 17:55:47 +02:00
|
|
|
|
2013-04-03 00:08:50 +02:00
|
|
|
#if CONFIG_MULTIPLE_ARF
|
2013-12-06 01:23:09 +01:00
|
|
|
int alt_ref_fb_idx[REF_FRAMES - 3];
|
2013-04-03 00:08:50 +02:00
|
|
|
#endif
|
2013-01-15 22:49:44 +01:00
|
|
|
int refresh_last_frame;
|
|
|
|
int refresh_golden_frame;
|
|
|
|
int refresh_alt_ref_frame;
|
2014-01-09 02:55:07 +01:00
|
|
|
|
|
|
|
int ext_refresh_frame_flags_pending;
|
|
|
|
int ext_refresh_last_frame;
|
|
|
|
int ext_refresh_golden_frame;
|
|
|
|
int ext_refresh_alt_ref_frame;
|
|
|
|
|
|
|
|
int ext_refresh_frame_context_pending;
|
|
|
|
int ext_refresh_frame_context;
|
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
YV12_BUFFER_CONFIG last_frame_uf;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
TOKENEXTRA *tok;
|
2013-06-12 19:30:06 +02:00
|
|
|
unsigned int tok_count[4][1 << 6];
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-04-03 00:08:50 +02:00
|
|
|
#if CONFIG_MULTIPLE_ARF
|
|
|
|
// Position within a frame coding order (including any additional ARF frames).
|
|
|
|
unsigned int sequence_number;
|
|
|
|
// Next frame in naturally occurring order that has not yet been coded.
|
|
|
|
int next_frame_in_order;
|
|
|
|
#endif
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
// Ambient reconstruction err target for force key frames
|
|
|
|
int ambient_err;
|
2011-01-17 18:23:11 +01:00
|
|
|
|
2013-10-07 20:20:10 +02:00
|
|
|
int rd_threshes[MAX_SEGMENTS][BLOCK_SIZES][MAX_MODES];
|
2013-08-10 02:47:32 +02:00
|
|
|
int rd_thresh_freq_fact[BLOCK_SIZES][MAX_MODES];
|
2013-10-07 20:20:10 +02:00
|
|
|
int rd_thresh_sub8x8[MAX_SEGMENTS][BLOCK_SIZES][MAX_REFS];
|
2013-09-28 01:02:49 +02:00
|
|
|
int rd_thresh_freq_sub8x8[BLOCK_SIZES][MAX_REFS];
|
2013-06-03 13:51:29 +02:00
|
|
|
|
2013-11-23 01:35:37 +01:00
|
|
|
int64_t rd_comp_pred_diff[REFERENCE_MODES];
|
|
|
|
int64_t rd_prediction_type_threshes[4][REFERENCE_MODES];
|
2013-07-29 22:38:40 +02:00
|
|
|
int64_t rd_tx_select_diff[TX_MODES];
|
2013-07-08 23:49:33 +02:00
|
|
|
// FIXME(rbultje) can this overflow?
|
2013-07-29 22:38:40 +02:00
|
|
|
int rd_tx_select_threshes[4][TX_MODES];
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-10-30 22:40:34 +01:00
|
|
|
int64_t rd_filter_diff[SWITCHABLE_FILTER_CONTEXTS];
|
|
|
|
int64_t rd_filter_threshes[4][SWITCHABLE_FILTER_CONTEXTS];
|
|
|
|
int64_t rd_filter_cache[SWITCHABLE_FILTER_CONTEXTS];
|
2013-12-17 02:52:59 +01:00
|
|
|
int64_t mask_filter_rd;
|
2013-07-08 23:49:33 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
int RDMULT;
|
|
|
|
int RDDIV;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
CODING_CONTEXT coding_context;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-11-06 22:13:59 +01:00
|
|
|
int zbin_mode_boost;
|
|
|
|
int zbin_mode_boost_enabled;
|
2012-07-14 00:21:29 +02:00
|
|
|
int active_arnr_frames; // <= cpi->oxcf.arnr_max_frames
|
2013-03-18 17:17:04 +01:00
|
|
|
int active_arnr_strength; // <= cpi->oxcf.arnr_max_strength
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-07-13 02:12:46 +02:00
|
|
|
double output_framerate;
|
2012-07-14 00:21:29 +02:00
|
|
|
int64_t last_time_stamp_seen;
|
|
|
|
int64_t last_end_time_stamp_seen;
|
|
|
|
int64_t first_time_stamp_ever;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-11-06 22:13:59 +01:00
|
|
|
RATE_CONTROL rc;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
int cq_target_quality;
|
2011-01-07 17:33:59 +01:00
|
|
|
|
2013-12-06 19:54:00 +01:00
|
|
|
vp9_coeff_count coef_counts[TX_SIZES][PLANE_TYPES];
|
|
|
|
vp9_coeff_probs_model frame_coef_probs[TX_SIZES][PLANE_TYPES];
|
|
|
|
vp9_coeff_stats frame_branch_ct[TX_SIZES][PLANE_TYPES];
|
32x32 transform for superblocks.
This adds Debargha's DCT/DWT hybrid and a regular 32x32 DCT, and adds
code all over the place to wrap that in the bitstream/encoder/decoder/RD.
Some implementation notes (these probably need careful review):
- token range is extended by 1 bit, since the value range out of this
transform is [-16384,16383].
- the coefficients coming out of the FDCT are manually scaled back by
1 bit, or else they won't fit in int16_t (they are 17 bits). Because
of this, the RD error scoring does not right-shift the MSE score by
two (unlike for 4x4/8x8/16x16).
- to compensate for this loss in precision, the quantizer is halved
also. This is currently a little hacky.
- FDCT and IDCT is double-only right now. Needs a fixed-point impl.
- There are no default probabilities for the 32x32 transform yet; I'm
simply using the 16x16 luma ones. A future commit will add newly
generated probabilities for all transforms.
- No ADST version. I don't think we'll add one for this level; if an
ADST is desired, transform-size selection can scale back to 16x16
or lower, and use an ADST at that level.
Additional notes specific to Debargha's DWT/DCT hybrid:
- coefficient scale is different for the top/left 16x16 (DCT-over-DWT)
block than for the rest (DWT pixel differences) of the block. Therefore,
RD error scoring isn't easily scalable between coefficient and pixel
domain. Thus, unfortunately, we need to compute the RD distortion in
the pixel domain until we figure out how to scale these appropriately.
Change-Id: I00386f20f35d7fabb19aba94c8162f8aee64ef2b
2012-12-07 23:45:05 +01:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
struct vpx_codec_pkt_list *output_pkt_list;
|
2010-10-14 22:40:12 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
MBGRAPH_FRAME_STATS mbgraph_stats[MAX_LAG_BUFFERS];
|
|
|
|
int mbgraph_n_frames; // number of frames filled in the above
|
|
|
|
int static_mb_pct; // % forced skip mbs by segmentation
|
|
|
|
int seg0_progress, seg0_idx, seg0_cnt;
|
|
|
|
|
|
|
|
// for real time encoding
|
2013-05-08 23:35:42 +02:00
|
|
|
int speed;
|
2012-07-14 00:21:29 +02:00
|
|
|
|
|
|
|
int cpu_used;
|
|
|
|
int pass;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2014-01-29 23:48:42 +01:00
|
|
|
vp9_prob last_skip_false_probs[3][SKIP_CONTEXTS];
|
2012-07-14 00:21:29 +02:00
|
|
|
int last_skip_probs_q[3];
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
int ref_frame_flags;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
SPEED_FEATURES sf;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-06-26 18:06:25 +02:00
|
|
|
unsigned int max_mv_magnitude;
|
2013-07-12 18:52:24 +02:00
|
|
|
int mv_step_param;
|
2013-06-26 18:06:25 +02:00
|
|
|
|
2014-02-04 20:09:34 +01:00
|
|
|
// Default value is 1. From first pass stats, encode_breakout may be disabled.
|
|
|
|
ENCODE_BREAKOUT_TYPE allow_encode_breakout;
|
|
|
|
|
|
|
|
// Get threshold from external input. In real time mode, it can be
|
|
|
|
// overwritten according to encoding speed.
|
|
|
|
int encode_breakout;
|
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
unsigned char *segmentation_map;
|
2011-09-13 12:26:39 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
// segment threshold for encode breakout
|
2013-07-23 13:09:04 +02:00
|
|
|
int segment_encode_breakout[MAX_SEGMENTS];
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-11-22 18:21:53 +01:00
|
|
|
unsigned char *complexity_map;
|
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
unsigned char *active_map;
|
|
|
|
unsigned int active_map_enabled;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
fractional_mv_step_fp *find_fractional_mv_step;
|
2013-08-08 02:01:43 +02:00
|
|
|
fractional_mv_step_comp_fp *find_fractional_mv_step_comp;
|
2012-10-31 22:40:53 +01:00
|
|
|
vp9_full_search_fn_t full_search_sad;
|
|
|
|
vp9_refining_search_fn_t refining_search_sad;
|
|
|
|
vp9_diamond_search_fn_t diamond_search_sad;
|
2013-08-10 02:47:32 +02:00
|
|
|
vp9_variance_fn_ptr_t fn_ptr[BLOCK_SIZES];
|
2012-08-11 02:05:46 +02:00
|
|
|
uint64_t time_receive_data;
|
|
|
|
uint64_t time_compress_data;
|
|
|
|
uint64_t time_pick_lpf;
|
2013-07-30 19:16:03 +02:00
|
|
|
uint64_t time_encode_sb_row;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2014-02-06 03:28:28 +01:00
|
|
|
struct twopass_rc twopass;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
YV12_BUFFER_CONFIG alt_ref_buffer;
|
|
|
|
YV12_BUFFER_CONFIG *frames[MAX_LAG_BUFFERS];
|
|
|
|
int fixed_divide[512];
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2011-04-29 18:37:59 +02:00
|
|
|
#if CONFIG_INTERNAL_STATS
|
2014-02-14 23:46:29 +01:00
|
|
|
unsigned int mode_chosen_counts[MAX_MODES];
|
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
int count;
|
|
|
|
double total_y;
|
|
|
|
double total_u;
|
|
|
|
double total_v;
|
|
|
|
double total;
|
2014-01-11 01:09:56 +01:00
|
|
|
uint64_t total_sq_error;
|
|
|
|
uint64_t total_samples;
|
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
double totalp_y;
|
|
|
|
double totalp_u;
|
|
|
|
double totalp_v;
|
|
|
|
double totalp;
|
2014-01-11 01:09:56 +01:00
|
|
|
uint64_t totalp_sq_error;
|
|
|
|
uint64_t totalp_samples;
|
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
int bytes;
|
|
|
|
double summed_quality;
|
|
|
|
double summed_weights;
|
2013-04-01 18:10:27 +02:00
|
|
|
double summedp_quality;
|
|
|
|
double summedp_weights;
|
2012-07-14 00:21:29 +02:00
|
|
|
unsigned int tot_recode_hits;
|
|
|
|
|
|
|
|
|
|
|
|
double total_ssimg_y;
|
|
|
|
double total_ssimg_u;
|
|
|
|
double total_ssimg_v;
|
|
|
|
double total_ssimg_all;
|
|
|
|
|
|
|
|
int b_calculate_ssimg;
|
2010-05-18 17:58:33 +02:00
|
|
|
#endif
|
2012-07-14 00:21:29 +02:00
|
|
|
int b_calculate_psnr;
|
2010-08-11 17:02:31 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
// Per MB activity measurement
|
|
|
|
unsigned int activity_avg;
|
|
|
|
unsigned int *mb_activity_map;
|
|
|
|
int *mb_norm_activity_map;
|
|
|
|
int output_partition;
|
2011-06-13 16:42:27 +02:00
|
|
|
|
2014-01-10 20:28:23 +01:00
|
|
|
// Force next frame to intra when kf_auto says so.
|
2012-07-14 00:21:29 +02:00
|
|
|
int force_next_frame_intra;
|
2011-08-25 22:54:45 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
int droppable;
|
2012-04-07 01:38:34 +02:00
|
|
|
|
2012-07-14 00:21:29 +02:00
|
|
|
int dummy_packing; /* flag to indicate if packing is dummy */
|
2012-05-02 22:53:15 +02:00
|
|
|
|
2013-09-25 02:24:35 +02:00
|
|
|
unsigned int tx_stepdown_count[TX_SIZES];
|
Tx size selection enhancements
(1) Refines the modeling function and uses that to add some speed
features. Specifically, instead of using a flag use_largest_txfm as
a speed feature, an enum tx_size_search_method is used, of which
two of the types are USE_FULL_RD and USE_LARGESTALL. Two other
new types are added:
USE_LARGESTINTRA (use largest only for intra)
USE_LARGESTINTRA_MODELINTER (use largest for intra, and model for
inter)
(2) Another change is that the framework for deciding transform type
is simplified to use a heuristic count based method rather than
an rd based method using txfm_cache. In practice the new method
is found to work just as well - with derf only -0.01 down.
The new method is more compatible with the new framework where
certain rd costs are based on full rd and certain others are
based on modeled rd or are not computed. In this patch the existing
rd based method is still kept for use in the USE_FULL_RD mode.
In the other modes, the count based method is used.
However the recommendation is to remove it eventually since the
benefit is limited, and will remove a lot of complications in
the code
(3) Finally a bug is fixed with the existing use_largest_txfm speed feature
that causes mismatches when the lossless mode and 4x4 WH transform is
forced.
Results on derf:
USE_FULL_RD: +0.03% (due to change in the tables), 0% encode time reduction
USE_LARGESTINTRA: -0.21%, 15% encode time reduction (this one is a
pretty good compromise)
USE_LARGESTINTRA_MODELINTER: -0.98%, 22% encode time reduction
(currently the benefit of modeling is limited for txfm size selection,
but keeping this enum as a placeholder) .
USE_LARGESTALL: -1.05%, 27% encode-time reduction (same as existing
use_largest_txfm speed feature).
Change-Id: I4d60a5f9ce78fbc90cddf2f97ed91d8bc0d4f936
2013-06-22 01:31:12 +02:00
|
|
|
|
2013-02-06 23:22:17 +01:00
|
|
|
int initial_width;
|
|
|
|
int initial_height;
|
2013-04-03 00:08:50 +02:00
|
|
|
|
2014-02-06 18:23:17 +01:00
|
|
|
int use_svc;
|
|
|
|
|
|
|
|
struct svc {
|
|
|
|
int spatial_layer_id;
|
|
|
|
int temporal_layer_id;
|
|
|
|
int number_spatial_layers;
|
|
|
|
int number_temporal_layers;
|
|
|
|
// Layer context used for rate control in CBR mode, only defined for
|
|
|
|
// temporal layers for now.
|
|
|
|
LAYER_CONTEXT layer_context[VPX_TS_MAX_LAYERS];
|
|
|
|
} svc;
|
|
|
|
|
2013-04-03 00:08:50 +02:00
|
|
|
#if CONFIG_MULTIPLE_ARF
|
|
|
|
// ARF tracking variables.
|
|
|
|
int multi_arf_enabled;
|
|
|
|
unsigned int frame_coding_order_period;
|
|
|
|
unsigned int new_frame_coding_order_period;
|
|
|
|
int frame_coding_order[MAX_LAG_BUFFERS * 2];
|
|
|
|
int arf_buffer_idx[MAX_LAG_BUFFERS * 3 / 2];
|
|
|
|
int arf_weight[MAX_LAG_BUFFERS];
|
|
|
|
int arf_buffered;
|
|
|
|
int this_frame_weight;
|
|
|
|
int max_arf_level;
|
|
|
|
#endif
|
2013-05-16 12:27:12 +02:00
|
|
|
|
|
|
|
#ifdef ENTROPY_STATS
|
2013-08-23 03:40:34 +02:00
|
|
|
int64_t mv_ref_stats[INTER_MODE_CONTEXTS][INTER_MODES - 1][2];
|
2013-05-16 12:27:12 +02:00
|
|
|
#endif
|
2013-08-21 13:34:14 +02:00
|
|
|
|
|
|
|
|
|
|
|
#ifdef MODE_TEST_HIT_STATS
|
|
|
|
// Debug / test stats
|
|
|
|
int64_t mode_test_hits[BLOCK_SIZES];
|
|
|
|
#endif
|
2013-10-24 18:10:59 +02:00
|
|
|
|
2014-01-10 20:28:23 +01:00
|
|
|
// Y,U,V,(A)
|
2013-10-24 18:10:59 +02:00
|
|
|
ENTROPY_CONTEXT *above_context[MAX_MB_PLANE];
|
|
|
|
ENTROPY_CONTEXT left_context[MAX_MB_PLANE][16];
|
|
|
|
|
2013-10-24 18:10:59 +02:00
|
|
|
PARTITION_CONTEXT *above_seg_context;
|
|
|
|
PARTITION_CONTEXT left_seg_context[8];
|
2012-10-31 01:53:32 +01:00
|
|
|
} VP9_COMP;
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2014-01-23 02:10:37 +01:00
|
|
|
static int get_ref_frame_idx(const VP9_COMP *cpi,
|
|
|
|
MV_REFERENCE_FRAME ref_frame) {
|
2013-05-21 00:59:39 +02:00
|
|
|
if (ref_frame == LAST_FRAME) {
|
|
|
|
return cpi->lst_fb_idx;
|
|
|
|
} else if (ref_frame == GOLDEN_FRAME) {
|
|
|
|
return cpi->gld_fb_idx;
|
|
|
|
} else {
|
|
|
|
return cpi->alt_fb_idx;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-01-06 23:50:54 +01:00
|
|
|
static YV12_BUFFER_CONFIG *get_ref_frame_buffer(VP9_COMP *cpi,
|
|
|
|
MV_REFERENCE_FRAME ref_frame) {
|
|
|
|
VP9_COMMON *const cm = &cpi->common;
|
2014-01-29 21:48:01 +01:00
|
|
|
return &cm->frame_bufs[cm->ref_frame_map[get_ref_frame_idx(cpi,
|
|
|
|
ref_frame)]].buf;
|
2014-01-06 23:50:54 +01:00
|
|
|
}
|
|
|
|
|
2012-10-31 01:53:32 +01:00
|
|
|
void vp9_encode_frame(VP9_COMP *cpi);
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2013-12-06 02:20:01 +01:00
|
|
|
void vp9_pack_bitstream(VP9_COMP *cpi, uint8_t *dest, size_t *size);
|
2010-05-18 17:58:33 +02:00
|
|
|
|
2012-10-31 01:53:32 +01:00
|
|
|
void vp9_set_speed_features(VP9_COMP *cpi);
|
2011-07-20 23:21:24 +02:00
|
|
|
|
2014-01-24 23:21:39 +01:00
|
|
|
int vp9_calc_ss_err(const YV12_BUFFER_CONFIG *source,
|
|
|
|
const YV12_BUFFER_CONFIG *reference);
|
2012-11-02 19:22:57 +01:00
|
|
|
|
2013-09-25 00:13:09 +02:00
|
|
|
void vp9_alloc_compressor_data(VP9_COMP *cpi);
|
2012-11-02 19:22:57 +01:00
|
|
|
|
2013-12-04 02:05:19 +01:00
|
|
|
int vp9_compute_qdelta(const VP9_COMP *cpi, double qstart, double qtarget);
|
2013-10-07 20:20:10 +02:00
|
|
|
|
2013-10-01 20:54:10 +02:00
|
|
|
// Returns mb_rows * mb_cols * (48 * 16 + 4), i.e. 772 units for every
// (row, column) cell of the grid.
// NOTE(review): presumably this is the number of token entries to allocate
// for a frame of mb_rows x mb_cols macroblocks -- confirm against callers.
// The product is computed in plain `int`; callers must keep the dimensions
// small enough that it does not overflow.
static int get_token_alloc(int mb_rows, int mb_cols) {
  return mb_rows * mb_cols * (48 * 16 + 4);
}
|
|
|
|
|
2014-01-28 01:00:20 +01:00
|
|
|
// Points xd->block_refs[0] and xd->block_refs[1] at the cm->frame_refs
// entries selected by ref0 and ref1 respectively. A reference value `r` maps
// to entry (r - LAST_FRAME); any value below LAST_FRAME is clamped to
// entry 0 so the pointer is always valid.
static void set_ref_ptrs(VP9_COMMON *cm, MACROBLOCKD *xd,
                         MV_REFERENCE_FRAME ref0, MV_REFERENCE_FRAME ref1) {
  const int idx0 = ref0 >= LAST_FRAME ? ref0 - LAST_FRAME : 0;
  const int idx1 = ref1 >= LAST_FRAME ? ref1 - LAST_FRAME : 0;

  xd->block_refs[0] = &cm->frame_refs[idx0];
  xd->block_refs[1] = &cm->frame_refs[idx1];
}
|
|
|
|
|
2014-01-18 21:16:11 +01:00
|
|
|
#ifdef __cplusplus
|
|
|
|
} // extern "C"
|
|
|
|
#endif
|
|
|
|
|
2012-12-19 00:31:19 +01:00
|
|
|
#endif // VP9_ENCODER_VP9_ONYX_INT_H_
|