
This patch removed the experiment of BIDIR_PRED and merged the feature into the experiment of EXT_REFS: (1) Each frame now has up to 6 reference frames, namely LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and BWDREF_FRAME, ALTREF_FRAME (backward); LAST4_FRAME has been removed; (2) First pass still keeps the 8 updates: KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE; (3) show_existing_frame==1 is supported in the experiment of EXT_REFS; (4) New encoding modes are added for both single-ref and compound cases, through the use of the 2 extra forward references (LAST2 & LAST3) and the 1 extra backward reference (BWDREF). RD performance wise, using Overall PSNR: Avg/BDRate Bipred only Prev EXT_REFS Current EXT_REFS with bipred lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387 derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252 midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636 If in vp10/encoder/firstpass.h, change BFG_INTERVAL from 2 to 3, i.e. to use 2 bi-predictive frames than 1, a further improvement may be obtained: Current EXT_REFS with bipred 1 bi-predictive frame 2 bi-predictive frames lowres: -4.613/-4.387 -4.675/-4.465 derflr: -3.120/-2.252 -3.333/-2.516 midres: -2.898/-2.636 -3.406/-3.095 Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
185 lines
5.0 KiB
C
185 lines
5.0 KiB
C
/*
|
|
* Copyright (c) 2010 The WebM project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#ifndef VP10_ENCODER_FIRSTPASS_H_
|
|
#define VP10_ENCODER_FIRSTPASS_H_
|
|
|
|
#include "vp10/encoder/lookahead.h"
|
|
#include "vp10/encoder/ratectrl.h"
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
#if CONFIG_FP_MB_STATS
|
|
|
|
#define FPMB_DCINTRA_MASK 0x01
|
|
|
|
#define FPMB_MOTION_ZERO_MASK 0x02
|
|
#define FPMB_MOTION_LEFT_MASK 0x04
|
|
#define FPMB_MOTION_RIGHT_MASK 0x08
|
|
#define FPMB_MOTION_UP_MASK 0x10
|
|
#define FPMB_MOTION_DOWN_MASK 0x20
|
|
|
|
#define FPMB_ERROR_SMALL_MASK 0x40
|
|
#define FPMB_ERROR_LARGE_MASK 0x80
|
|
#define FPMB_ERROR_SMALL_TH 2000
|
|
#define FPMB_ERROR_LARGE_TH 48000
|
|
|
|
typedef struct {
|
|
uint8_t *mb_stats_start;
|
|
uint8_t *mb_stats_end;
|
|
} FIRSTPASS_MB_STATS;
|
|
#endif
|
|
|
|
#if CONFIG_EXT_REFS
|
|
// Length of the bi-predictive frame group (BFG)
|
|
// NOTE: Currently each BFG contains one backward ref (BWF) frame plus a certain
|
|
// number of bi-predictive frames.
|
|
#define BFG_INTERVAL 2
|
|
#endif // CONFIG_EXT_REFS
|
|
|
|
#define VLOW_MOTION_THRESHOLD 950
|
|
|
|
typedef struct {
|
|
double frame;
|
|
double weight;
|
|
double intra_error;
|
|
double coded_error;
|
|
double sr_coded_error;
|
|
double pcnt_inter;
|
|
double pcnt_motion;
|
|
double pcnt_second_ref;
|
|
double pcnt_neutral;
|
|
double intra_skip_pct;
|
|
double inactive_zone_rows; // Image mask rows top and bottom.
|
|
double inactive_zone_cols; // Image mask columns at left and right edges.
|
|
double MVr;
|
|
double mvr_abs;
|
|
double MVc;
|
|
double mvc_abs;
|
|
double MVrv;
|
|
double MVcv;
|
|
double mv_in_out_count;
|
|
double new_mv_count;
|
|
double duration;
|
|
double count;
|
|
} FIRSTPASS_STATS;
|
|
|
|
typedef enum {
|
|
KF_UPDATE = 0,
|
|
LF_UPDATE = 1,
|
|
GF_UPDATE = 2,
|
|
ARF_UPDATE = 3,
|
|
OVERLAY_UPDATE = 4,
|
|
#if CONFIG_EXT_REFS
|
|
BRF_UPDATE = 5, // Backward Reference Frame
|
|
LAST_BIPRED_UPDATE = 6, // Last Bi-predictive Frame
|
|
BIPRED_UPDATE = 7, // Bi-predictive Frame, but not the last one
|
|
FRAME_UPDATE_TYPES = 8
|
|
#else
|
|
FRAME_UPDATE_TYPES = 5
|
|
#endif // CONFIG_EXT_REFS
|
|
} FRAME_UPDATE_TYPE;
|
|
|
|
#define FC_ANIMATION_THRESH 0.15
|
|
typedef enum {
|
|
FC_NORMAL = 0,
|
|
FC_GRAPHICS_ANIMATION = 1,
|
|
FRAME_CONTENT_TYPES = 2
|
|
} FRAME_CONTENT_TYPE;
|
|
|
|
typedef struct {
|
|
unsigned char index;
|
|
RATE_FACTOR_LEVEL rf_level[(MAX_LAG_BUFFERS * 2) + 1];
|
|
FRAME_UPDATE_TYPE update_type[(MAX_LAG_BUFFERS * 2) + 1];
|
|
unsigned char arf_src_offset[(MAX_LAG_BUFFERS * 2) + 1];
|
|
unsigned char arf_update_idx[(MAX_LAG_BUFFERS * 2) + 1];
|
|
unsigned char arf_ref_idx[(MAX_LAG_BUFFERS * 2) + 1];
|
|
#if CONFIG_EXT_REFS
|
|
unsigned char brf_src_offset[(MAX_LAG_BUFFERS * 2) + 1];
|
|
unsigned char bidir_pred_enabled[(MAX_LAG_BUFFERS * 2) + 1];
|
|
#endif // CONFIG_EXT_REFS
|
|
int bit_allocation[(MAX_LAG_BUFFERS * 2) + 1];
|
|
} GF_GROUP;
|
|
|
|
typedef struct {
|
|
unsigned int section_intra_rating;
|
|
FIRSTPASS_STATS total_stats;
|
|
FIRSTPASS_STATS this_frame_stats;
|
|
const FIRSTPASS_STATS *stats_in;
|
|
const FIRSTPASS_STATS *stats_in_start;
|
|
const FIRSTPASS_STATS *stats_in_end;
|
|
FIRSTPASS_STATS total_left_stats;
|
|
int first_pass_done;
|
|
int64_t bits_left;
|
|
double modified_error_min;
|
|
double modified_error_max;
|
|
double modified_error_left;
|
|
double mb_av_energy;
|
|
|
|
#if CONFIG_FP_MB_STATS
|
|
uint8_t *frame_mb_stats_buf;
|
|
uint8_t *this_frame_mb_stats;
|
|
FIRSTPASS_MB_STATS firstpass_mb_stats;
|
|
#endif
|
|
// An indication of the content type of the current frame
|
|
FRAME_CONTENT_TYPE fr_content_type;
|
|
|
|
// Projected total bits available for a key frame group of frames
|
|
int64_t kf_group_bits;
|
|
|
|
// Error score of frames still to be coded in kf group
|
|
int64_t kf_group_error_left;
|
|
|
|
// The fraction for a kf groups total bits allocated to the inter frames
|
|
double kfgroup_inter_fraction;
|
|
|
|
int sr_update_lag;
|
|
|
|
int kf_zeromotion_pct;
|
|
int last_kfgroup_zeromotion_pct;
|
|
int gf_zeromotion_pct;
|
|
int active_worst_quality;
|
|
int baseline_active_worst_quality;
|
|
int extend_minq;
|
|
int extend_maxq;
|
|
int extend_minq_fast;
|
|
|
|
GF_GROUP gf_group;
|
|
} TWO_PASS;
|
|
|
|
struct VP10_COMP;
|
|
|
|
void vp10_init_first_pass(struct VP10_COMP *cpi);
|
|
void vp10_rc_get_first_pass_params(struct VP10_COMP *cpi);
|
|
void vp10_first_pass(struct VP10_COMP *cpi,
|
|
const struct lookahead_entry *source);
|
|
void vp10_end_first_pass(struct VP10_COMP *cpi);
|
|
|
|
void vp10_init_second_pass(struct VP10_COMP *cpi);
|
|
void vp10_rc_get_second_pass_params(struct VP10_COMP *cpi);
|
|
void vp10_twopass_postencode_update(struct VP10_COMP *cpi);
|
|
|
|
// Post encode update of the rate control parameters for 2-pass
|
|
void vp10_twopass_postencode_update(struct VP10_COMP *cpi);
|
|
|
|
void vp10_init_subsampling(struct VP10_COMP *cpi);
|
|
|
|
void vp10_calculate_coded_size(struct VP10_COMP *cpi,
|
|
int *scaled_frame_width,
|
|
int *scaled_frame_height);
|
|
|
|
#ifdef __cplusplus
|
|
} // extern "C"
|
|
#endif
|
|
|
|
#endif // VP10_ENCODER_FIRSTPASS_H_
|