faf8c63b0f
Some initial experiments into discounting dead zone formatting bars and intra skip blocks (common in some types of animation and graphics) in the calculation of the active max Q for each ARF/GF group. TODO: check for vertical formatting bars and validate the horizontal bar at the bottom edge of the image. As expected, this change, as it stands, does not make much difference for the natural videos in the std-hd and derf sets. However, for the yt and yt hd sets there is a significant rise in the average PSNR, with overall PSNR and SSIM remaining neutral. The mean rise for the YT-HD test set was > 6%. This is mainly because the change allows Q to drop further on titles and other graphics sections where spending a small number of extra bits gives a sharp rise in PSNR. Change-Id: I3f878ae91fc1854312d7ecf9fa792c17bc1aa6b7
166 lines
4.3 KiB
C
166 lines
4.3 KiB
C
/*
 *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
|
|
|
|
#ifndef VP9_ENCODER_VP9_FIRSTPASS_H_
|
|
#define VP9_ENCODER_VP9_FIRSTPASS_H_
|
|
|
|
#include "vp9/encoder/vp9_lookahead.h"
|
|
#include "vp9/encoder/vp9_ratectrl.h"
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
#if CONFIG_FP_MB_STATS
|
|
|
|
// Per-macroblock first-pass flag bits. Each mask selects exactly one bit, and
// together the eight masks cover bits 0..7 of a single byte.
// NOTE(review): the meaning of each flag is inferred from its name only;
// confirm against the code that sets and tests them.

// Bit 0 (0x01).
#define FPMB_DCINTRA_MASK (1 << 0)

// Bits 1..5 (0x02, 0x04, 0x08, 0x10, 0x20): motion flags.
#define FPMB_MOTION_ZERO_MASK (1 << 1)
#define FPMB_MOTION_LEFT_MASK (1 << 2)
#define FPMB_MOTION_RIGHT_MASK (1 << 3)
#define FPMB_MOTION_UP_MASK (1 << 4)
#define FPMB_MOTION_DOWN_MASK (1 << 5)

// Bits 6..7 (0x40, 0x80): error magnitude flags.
#define FPMB_ERROR_SMALL_MASK (1 << 6)
#define FPMB_ERROR_LARGE_MASK (1 << 7)

// Presumably the error levels that decide whether the SMALL / LARGE error
// flags are raised -- TODO confirm units and comparison direction.
#define FPMB_ERROR_SMALL_TH 2000
#define FPMB_ERROR_LARGE_TH 48000
|
|
|
|
// A pair of byte pointers delimiting a buffer of per-macroblock first-pass
// statistics.
// NOTE(review): whether mb_stats_end is inclusive or one-past-the-end, and
// who owns the memory, cannot be told from this header -- confirm at the
// allocation site.
typedef struct {
  uint8_t *mb_stats_start;
  uint8_t *mb_stats_end;
} FIRSTPASS_MB_STATS;
|
|
#endif
|
|
|
|
// NOTE(review): the name suggests a "very low motion" cut-off; its units and
// the value it is compared against are not visible in this header -- confirm.
#define VLOW_MOTION_THRESHOLD 950
|
|
|
|
// First-pass statistics record. Every member except spatial_layer_id is a
// double; spatial_layer_id is a 64-bit integer.
// NOTE(review): presumably these records are stored and exchanged as raw
// structs, so member order and types should be treated as a fixed layout --
// confirm before reordering or retyping anything here.
typedef struct {
  double frame;
  double weight;

  // Error terms.
  double intra_error;
  double coded_error;
  double sr_coded_error;

  // Proportions of the frame (exact units / range: TODO confirm).
  double pcnt_inter;
  double pcnt_motion;
  double pcnt_second_ref;
  double pcnt_neutral;
  double intra_skip_pct;
  double inactive_zone_rows;  // Image mask rows top and bottom.

  // Motion vector statistics (presumably 'r' = row and 'c' = column
  // components -- confirm).
  double MVr;
  double mvr_abs;
  double MVc;
  double mvc_abs;
  double MVrv;
  double MVcv;
  double mv_in_out_count;
  double new_mv_count;

  double duration;
  double count;
  int64_t spatial_layer_id;
} FIRSTPASS_STATS;
|
|
|
|
// Kind of update assigned to a frame. The values are explicit and
// contiguous from 0; FRAME_UPDATE_TYPES equals the number of real types and
// is not itself an update type.
// NOTE(review): the expansions of the abbreviations (KF = key frame,
// LF = last frame, GF = golden frame, ARF = alt-ref frame) are assumed from
// the names -- confirm.
typedef enum {
  KF_UPDATE = 0,
  LF_UPDATE = 1,
  GF_UPDATE = 2,
  ARF_UPDATE = 3,
  OVERLAY_UPDATE = 4,
  FRAME_UPDATE_TYPES = 5  // Count of the entries above.
} FRAME_UPDATE_TYPE;
|
|
|
|
// NOTE(review): presumably the cut-off used to classify a frame as
// FC_GRAPHICS_ANIMATION; the quantity it is compared with is not visible in
// this header -- confirm.
#define FC_ANIMATION_THRESH 0.15

// Content classification of a frame. FRAME_CONTENT_TYPES equals the number
// of real classes and is not itself a class.
typedef enum {
  FC_NORMAL = 0,
  FC_GRAPHICS_ANIMATION = 1,
  FRAME_CONTENT_TYPES = 2  // Count of the entries above.
} FRAME_CONTENT_TYPE;
|
|
|
|
typedef struct {
|
|
unsigned char index;
|
|
RATE_FACTOR_LEVEL rf_level[(MAX_LAG_BUFFERS * 2) + 1];
|
|
FRAME_UPDATE_TYPE update_type[(MAX_LAG_BUFFERS * 2) + 1];
|
|
unsigned char arf_src_offset[(MAX_LAG_BUFFERS * 2) + 1];
|
|
unsigned char arf_update_idx[(MAX_LAG_BUFFERS * 2) + 1];
|
|
unsigned char arf_ref_idx[(MAX_LAG_BUFFERS * 2) + 1];
|
|
int bit_allocation[(MAX_LAG_BUFFERS * 2) + 1];
|
|
} GF_GROUP;
|
|
|
|
typedef struct {
|
|
unsigned int section_intra_rating;
|
|
FIRSTPASS_STATS total_stats;
|
|
FIRSTPASS_STATS this_frame_stats;
|
|
const FIRSTPASS_STATS *stats_in;
|
|
const FIRSTPASS_STATS *stats_in_start;
|
|
const FIRSTPASS_STATS *stats_in_end;
|
|
FIRSTPASS_STATS total_left_stats;
|
|
int first_pass_done;
|
|
int64_t bits_left;
|
|
double modified_error_min;
|
|
double modified_error_max;
|
|
double modified_error_left;
|
|
double mb_av_energy;
|
|
|
|
#if CONFIG_FP_MB_STATS
|
|
uint8_t *frame_mb_stats_buf;
|
|
uint8_t *this_frame_mb_stats;
|
|
FIRSTPASS_MB_STATS firstpass_mb_stats;
|
|
#endif
|
|
// An indication of the content type of the current frame
|
|
FRAME_CONTENT_TYPE fr_content_type;
|
|
|
|
// Projected total bits available for a key frame group of frames
|
|
int64_t kf_group_bits;
|
|
|
|
// Error score of frames still to be coded in kf group
|
|
int64_t kf_group_error_left;
|
|
|
|
// The fraction for a kf groups total bits allocated to the inter frames
|
|
double kfgroup_inter_fraction;
|
|
|
|
int sr_update_lag;
|
|
|
|
int kf_zeromotion_pct;
|
|
int last_kfgroup_zeromotion_pct;
|
|
int gf_zeromotion_pct;
|
|
int active_worst_quality;
|
|
int baseline_active_worst_quality;
|
|
int extend_minq;
|
|
int extend_maxq;
|
|
int extend_minq_fast;
|
|
|
|
GF_GROUP gf_group;
|
|
} TWO_PASS;
|
|
|
|
// Forward declaration only: this header passes the encoder instance around
// by pointer and never needs its definition.
struct VP9_COMP;

// First-pass entry points. Each takes the encoder instance `cpi`;
// vp9_first_pass additionally takes a read-only lookahead entry.
// NOTE(review): call order and side effects are not visible from this
// header -- see the implementation.
void vp9_init_first_pass(struct VP9_COMP *cpi);
void vp9_rc_get_first_pass_params(struct VP9_COMP *cpi);
void vp9_first_pass(struct VP9_COMP *cpi, const struct lookahead_entry *source);
void vp9_end_first_pass(struct VP9_COMP *cpi);
|
|
|
|
// Second-pass entry points. Each takes the encoder instance `cpi`.
// NOTE(review): call order and side effects are not visible from this
// header -- see the implementation.
void vp9_init_second_pass(struct VP9_COMP *cpi);
void vp9_rc_get_second_pass_params(struct VP9_COMP *cpi);

// Post encode update of the rate control parameters for 2-pass
// (declared once; a redundant second declaration has been removed).
void vp9_twopass_postencode_update(struct VP9_COMP *cpi);
|
|
|
|
void vp9_init_subsampling(struct VP9_COMP *cpi);

// NOTE(review): presumably writes the resulting dimensions through
// scaled_frame_width / scaled_frame_height (both are non-const int
// pointers) -- confirm in the implementation.
void calculate_coded_size(struct VP9_COMP *cpi, int *scaled_frame_width,
                          int *scaled_frame_height);
|
|
|
|
#ifdef __cplusplus
|
|
} // extern "C"
|
|
#endif
|
|
|
|
#endif // VP9_ENCODER_VP9_FIRSTPASS_H_
|