Adjustments to cyclic refresh (aq-mode=3).
Target higher delta-qp for big blocks with zero motion, and for segment#1: avoid 64x64 partition size and force 8x8 tx size. Metrics on RTC set mostly positive: SSIM up by ~4%, PSNR by ~1.5%. There doesn't seem to be any change in speed. Change-Id: I1f68fa3c4f62dab3b90cc58041f05ebb048ae5ac
This commit is contained in:
parent
a28a8cb726
commit
0187f4b411
@ -96,30 +96,35 @@ static int apply_cyclic_refresh_bitrate(const VP9_COMMON *cm,
|
||||
static int candidate_refresh_aq(const CYCLIC_REFRESH *cr,
|
||||
const MB_MODE_INFO *mbmi,
|
||||
int64_t rate,
|
||||
int64_t dist) {
|
||||
int64_t dist,
|
||||
int bsize) {
|
||||
MV mv = mbmi->mv[0].as_mv;
|
||||
// If projected rate is below the thresh_rate accept it for lower-qp coding.
|
||||
// Otherwise, reject the block for lower-qp coding if projected distortion
|
||||
// Reject the block for lower-qp coding if projected distortion
|
||||
// is above the threshold, and any of the following is true:
|
||||
// 1) mode uses large mv
|
||||
// 2) mode is an intra-mode
|
||||
if (rate < cr->thresh_rate_sb)
|
||||
return 1;
|
||||
else if (dist > cr->thresh_dist_sb &&
|
||||
(mv.row > cr->motion_thresh || mv.row < -cr->motion_thresh ||
|
||||
mv.col > cr->motion_thresh || mv.col < -cr->motion_thresh ||
|
||||
!is_inter_block(mbmi)))
|
||||
return 0;
|
||||
// Otherwise accept for refresh.
|
||||
if (dist > cr->thresh_dist_sb &&
|
||||
(mv.row > cr->motion_thresh || mv.row < -cr->motion_thresh ||
|
||||
mv.col > cr->motion_thresh || mv.col < -cr->motion_thresh ||
|
||||
!is_inter_block(mbmi)))
|
||||
return CR_SEGMENT_ID_BASE;
|
||||
else if (bsize >= BLOCK_32X32 &&
|
||||
rate < cr->thresh_rate_sb &&
|
||||
is_inter_block(mbmi) &&
|
||||
mbmi->mv[0].as_int == 0)
|
||||
// More aggressive delta-q for bigger blocks with zero motion.
|
||||
return CR_SEGMENT_ID_BOOST2;
|
||||
else
|
||||
return 1;
|
||||
return CR_SEGMENT_ID_BOOST1;
|
||||
}
|
||||
|
||||
// Compute delta-q for the segment.
|
||||
static int compute_deltaq(const VP9_COMP *cpi, int q) {
|
||||
static int compute_deltaq(const VP9_COMP *cpi, int q, double rate_factor) {
|
||||
const CYCLIC_REFRESH *const cr = cpi->cyclic_refresh;
|
||||
const RATE_CONTROL *const rc = &cpi->rc;
|
||||
int deltaq = vp9_compute_qdelta_by_rate(rc, cpi->common.frame_type,
|
||||
q, cr->rate_ratio_qdelta,
|
||||
q, rate_factor,
|
||||
cpi->common.bit_depth);
|
||||
if ((-deltaq) > cr->max_qdelta_perc * q / 100) {
|
||||
deltaq = -cr->max_qdelta_perc * q / 100;
|
||||
@ -128,8 +133,9 @@ static int compute_deltaq(const VP9_COMP *cpi, int q) {
|
||||
}
|
||||
|
||||
// For the just encoded frame, estimate the bits, incorporating the delta-q
|
||||
// from segment 1. This function is called in the postencode (called from
|
||||
// rc_update_rate_correction_factors()).
|
||||
// from non-base segment. For now ignore effect of multiple segments
|
||||
// (with different delta-q). Note this function is called in the postencode
|
||||
// (called from rc_update_rate_correction_factors()).
|
||||
int vp9_cyclic_refresh_estimate_bits_at_q(const VP9_COMP *cpi,
|
||||
double correction_factor) {
|
||||
const VP9_COMMON *const cm = &cpi->common;
|
||||
@ -137,11 +143,11 @@ int vp9_cyclic_refresh_estimate_bits_at_q(const VP9_COMP *cpi,
|
||||
int estimated_bits;
|
||||
int mbs = cm->MBs;
|
||||
int num8x8bl = mbs << 2;
|
||||
// Weight for segment 1: use actual number of blocks refreshed in
|
||||
// Weight for non-base segments: use actual number of blocks refreshed in
|
||||
// previous/just encoded frame. Note number of blocks here is in 8x8 units.
|
||||
double weight_segment = (double)cr->actual_num_seg_blocks / num8x8bl;
|
||||
// Compute delta-q that was used in the just encoded frame.
|
||||
int deltaq = compute_deltaq(cpi, cm->base_qindex);
|
||||
int deltaq = compute_deltaq(cpi, cm->base_qindex, cr->rate_ratio_qdelta);
|
||||
// Take segment weighted average for estimated bits.
|
||||
estimated_bits = (int)((1.0 - weight_segment) *
|
||||
vp9_estimate_bits_at_q(cm->frame_type, cm->base_qindex, mbs,
|
||||
@ -155,6 +161,8 @@ int vp9_cyclic_refresh_estimate_bits_at_q(const VP9_COMP *cpi,
|
||||
// Prior to encoding the frame, estimate the bits per mb, for a given q = i and
|
||||
// a corresponding delta-q (for segment 1). This function is called in the
|
||||
// rc_regulate_q() to set the base qp index.
|
||||
// Note: the segment map is set to either 0/CR_SEGMENT_ID_BASE (no refresh) or
|
||||
// to 1/CR_SEGMENT_ID_BOOST1 (refresh) for each superblock, prior to encoding.
|
||||
int vp9_cyclic_refresh_rc_bits_per_mb(const VP9_COMP *cpi, int i,
|
||||
double correction_factor) {
|
||||
const VP9_COMMON *const cm = &cpi->common;
|
||||
@ -171,7 +179,7 @@ int vp9_cyclic_refresh_rc_bits_per_mb(const VP9_COMP *cpi, int i,
|
||||
// does not occur/is very small.
|
||||
double weight_segment = (double)cr->target_num_seg_blocks / num8x8bl;
|
||||
// Compute delta-q corresponding to qindex i.
|
||||
int deltaq = compute_deltaq(cpi, i);
|
||||
int deltaq = compute_deltaq(cpi, i, cr->rate_ratio_qdelta);
|
||||
// Take segment weighted average for bits per mb.
|
||||
bits_per_mb = (int)((1.0 - weight_segment) *
|
||||
vp9_rc_bits_per_mb(cm->frame_type, i, correction_factor, cm->bit_depth) +
|
||||
@ -197,20 +205,22 @@ void vp9_cyclic_refresh_update_segment(VP9_COMP *const cpi,
|
||||
const int xmis = MIN(cm->mi_cols - mi_col, bw);
|
||||
const int ymis = MIN(cm->mi_rows - mi_row, bh);
|
||||
const int block_index = mi_row * cm->mi_cols + mi_col;
|
||||
const int refresh_this_block = candidate_refresh_aq(cr, mbmi, rate, dist);
|
||||
const int refresh_this_block = candidate_refresh_aq(cr, mbmi, rate, dist,
|
||||
bsize);
|
||||
// Default is to not update the refresh map.
|
||||
int new_map_value = cr->map[block_index];
|
||||
int x = 0; int y = 0;
|
||||
|
||||
// Check if we should reset the segment_id for this block.
|
||||
if (mbmi->segment_id > 0 && !refresh_this_block)
|
||||
mbmi->segment_id = 0;
|
||||
// If this block is labeled for refresh, check if we should reset the
|
||||
// segment_id.
|
||||
if (mbmi->segment_id != CR_SEGMENT_ID_BASE)
|
||||
mbmi->segment_id = refresh_this_block;
|
||||
|
||||
// Update the cyclic refresh map, to be used for setting segmentation map
|
||||
// for the next frame. If the block will be refreshed this frame, mark it
|
||||
// as clean. The magnitude of the -ve influences how long before we consider
|
||||
// it for refresh again.
|
||||
if (mbmi->segment_id == 1) {
|
||||
if (mbmi->segment_id != CR_SEGMENT_ID_BASE) {
|
||||
new_map_value = -cr->time_for_refresh;
|
||||
} else if (refresh_this_block) {
|
||||
// Else if it is accepted as candidate for refresh, and has not already
|
||||
@ -242,20 +252,24 @@ void vp9_cyclic_refresh_update_actual_count(struct VP9_COMP *const cpi) {
|
||||
cr->actual_num_seg_blocks = 0;
|
||||
for (mi_row = 0; mi_row < cm->mi_rows; mi_row++)
|
||||
for (mi_col = 0; mi_col < cm->mi_cols; mi_col++) {
|
||||
if (seg_map[mi_row * cm->mi_cols + mi_col] == 1)
|
||||
if (seg_map[mi_row * cm->mi_cols + mi_col] != CR_SEGMENT_ID_BASE)
|
||||
cr->actual_num_seg_blocks++;
|
||||
}
|
||||
}
|
||||
|
||||
// Update the segmentation map, and related quantities: cyclic refresh map,
|
||||
// refresh sb_index, and target number of blocks to be refreshed.
|
||||
// The map is set to either 0/CR_SEGMENT_ID_BASE (no refresh) or to
|
||||
// 1/CR_SEGMENT_ID_BOOST1 (refresh) for each superblock.
|
||||
// Blocks labeled as BOOST1 may later get set to BOOST2 (during the
|
||||
// encoding of the superblock).
|
||||
void vp9_cyclic_refresh_update_map(VP9_COMP *const cpi) {
|
||||
VP9_COMMON *const cm = &cpi->common;
|
||||
CYCLIC_REFRESH *const cr = cpi->cyclic_refresh;
|
||||
unsigned char *const seg_map = cpi->segmentation_map;
|
||||
int i, block_count, bl_index, sb_rows, sb_cols, sbs_in_frame;
|
||||
int xmis, ymis, x, y;
|
||||
vpx_memset(seg_map, 0, cm->mi_rows * cm->mi_cols);
|
||||
vpx_memset(seg_map, CR_SEGMENT_ID_BASE, cm->mi_rows * cm->mi_cols);
|
||||
sb_cols = (cm->mi_cols + MI_BLOCK_SIZE - 1) / MI_BLOCK_SIZE;
|
||||
sb_rows = (cm->mi_rows + MI_BLOCK_SIZE - 1) / MI_BLOCK_SIZE;
|
||||
sbs_in_frame = sb_cols * sb_rows;
|
||||
@ -300,7 +314,7 @@ void vp9_cyclic_refresh_update_map(VP9_COMP *const cpi) {
|
||||
if (sum_map >= xmis * ymis / 2) {
|
||||
for (y = 0; y < ymis; y++)
|
||||
for (x = 0; x < xmis; x++) {
|
||||
seg_map[bl_index + y * cm->mi_cols + x] = 1;
|
||||
seg_map[bl_index + y * cm->mi_cols + x] = CR_SEGMENT_ID_BOOST1;
|
||||
}
|
||||
cr->target_num_seg_blocks += xmis * ymis;
|
||||
}
|
||||
@ -352,11 +366,11 @@ void vp9_cyclic_refresh_setup(VP9_COMP *const cpi) {
|
||||
vp9_clear_system_state();
|
||||
cr->max_qdelta_perc = 50;
|
||||
cr->time_for_refresh = 0;
|
||||
// Set rate threshold to some fraction (set to 1 for now) of the target
|
||||
// Set rate threshold to some multiple (set to 2 for now) of the target
|
||||
// rate (target is given by sb64_target_rate and scaled by 256).
|
||||
cr->thresh_rate_sb = (rc->sb64_target_rate << 8);
|
||||
cr->thresh_rate_sb = (rc->sb64_target_rate << 8) << 1;
|
||||
// Distortion threshold, quadratic in Q, scale factor to be adjusted.
|
||||
cr->thresh_dist_sb = (int)(q * q) << 5;
|
||||
cr->thresh_dist_sb = (int)(q * q) << 2;
|
||||
cr->motion_thresh = 32;
|
||||
// Set up segmentation.
|
||||
// Clear down the segment map.
|
||||
@ -372,19 +386,27 @@ void vp9_cyclic_refresh_setup(VP9_COMP *const cpi) {
|
||||
// relative to 0 previous map.
|
||||
// seg->temporal_update = 0;
|
||||
|
||||
// Segment 0 "Q" feature is disabled so it defaults to the baseline Q.
|
||||
vp9_disable_segfeature(seg, 0, SEG_LVL_ALT_Q);
|
||||
// Use segment 1 for in-frame Q adjustment.
|
||||
vp9_enable_segfeature(seg, 1, SEG_LVL_ALT_Q);
|
||||
// Segment BASE "Q" feature is disabled so it defaults to the baseline Q.
|
||||
vp9_disable_segfeature(seg, CR_SEGMENT_ID_BASE, SEG_LVL_ALT_Q);
|
||||
// Use segment BOOST1 for in-frame Q adjustment.
|
||||
vp9_enable_segfeature(seg, CR_SEGMENT_ID_BOOST1, SEG_LVL_ALT_Q);
|
||||
// Use segment BOOST2 for more aggressive in-frame Q adjustment.
|
||||
vp9_enable_segfeature(seg, CR_SEGMENT_ID_BOOST2, SEG_LVL_ALT_Q);
|
||||
|
||||
// Set the q delta for segment 1.
|
||||
qindex_delta = compute_deltaq(cpi, cm->base_qindex);
|
||||
// Set the q delta for segment BOOST1.
|
||||
qindex_delta = compute_deltaq(cpi, cm->base_qindex, cr->rate_ratio_qdelta);
|
||||
|
||||
// Compute rd-mult for segment 1.
|
||||
// Compute rd-mult for segment BOOST1.
|
||||
qindex2 = clamp(cm->base_qindex + cm->y_dc_delta_q + qindex_delta, 0, MAXQ);
|
||||
cr->rdmult = vp9_compute_rd_mult(cpi, qindex2);
|
||||
|
||||
vp9_set_segdata(seg, 1, SEG_LVL_ALT_Q, qindex_delta);
|
||||
vp9_set_segdata(seg, CR_SEGMENT_ID_BOOST1, SEG_LVL_ALT_Q, qindex_delta);
|
||||
|
||||
// Set a more aggressive (higher) q delta for segment BOOST2.
|
||||
qindex_delta = compute_deltaq(cpi, cm->base_qindex,
|
||||
MIN(CR_MAX_RATE_TARGET_RATIO,
|
||||
CR_BOOST2_FAC * cr->rate_ratio_qdelta));
|
||||
vp9_set_segdata(seg, CR_SEGMENT_ID_BOOST2, SEG_LVL_ALT_Q, qindex_delta);
|
||||
|
||||
// Update the segmentation and refresh map.
|
||||
vp9_cyclic_refresh_update_map(cpi);
|
||||
|
@ -18,6 +18,18 @@
|
||||
extern "C" {
|
||||
#endif
|
||||
|
||||
// The segment ids used in cyclic refresh: from base (no boost) to increasing
|
||||
// boost (higher delta-qp).
|
||||
#define CR_SEGMENT_ID_BASE 0
|
||||
#define CR_SEGMENT_ID_BOOST1 1
|
||||
#define CR_SEGMENT_ID_BOOST2 2
|
||||
|
||||
// Maximum rate target ratio for setting segment delta-qp.
|
||||
#define CR_MAX_RATE_TARGET_RATIO 4.0
|
||||
|
||||
// Boost factor for rate target ratio, for segment CR_SEGMENT_ID_BOOST2.
|
||||
#define CR_BOOST2_FAC 1.7
|
||||
|
||||
struct VP9_COMP;
|
||||
|
||||
struct CYCLIC_REFRESH;
|
||||
|
@ -403,7 +403,8 @@ static int set_vt_partitioning(VP9_COMP *cpi,
|
||||
int mi_row,
|
||||
int mi_col,
|
||||
int64_t threshold,
|
||||
BLOCK_SIZE bsize_min) {
|
||||
BLOCK_SIZE bsize_min,
|
||||
int segment_id) {
|
||||
VP9_COMMON * const cm = &cpi->common;
|
||||
variance_node vt;
|
||||
const int block_width = num_8x8_blocks_wide_lookup[bsize];
|
||||
@ -412,6 +413,10 @@ static int set_vt_partitioning(VP9_COMP *cpi,
|
||||
assert(block_height == block_width);
|
||||
tree_to_node(data, bsize, &vt);
|
||||
|
||||
// No 64x64 blocks on segments other than base (un-boosted) segment.
|
||||
if (segment_id != CR_SEGMENT_ID_BASE && bsize == BLOCK_64X64)
|
||||
return 0;
|
||||
|
||||
// For bsize=bsize_min (16x16/8x8 for 8x8/4x4 downsampling), select if
|
||||
// variance is below threshold, otherwise split will be selected.
|
||||
// No check for vert/horiz split as too few samples for variance.
|
||||
@ -645,6 +650,13 @@ static void choose_partitioning(VP9_COMP *cpi,
|
||||
const int low_res = (cm->width <= 352 && cm->height <= 288);
|
||||
int variance4x4downsample[16];
|
||||
|
||||
int segment_id = CR_SEGMENT_ID_BASE;
|
||||
if (cpi->oxcf.aq_mode == CYCLIC_REFRESH_AQ && cm->seg.enabled) {
|
||||
const uint8_t *const map = cm->seg.update_map ? cpi->segmentation_map :
|
||||
cm->last_frame_seg_map;
|
||||
segment_id = vp9_get_segment_id(cm, map, BLOCK_64X64, mi_row, mi_col);
|
||||
}
|
||||
|
||||
set_offsets(cpi, tile, x, mi_row, mi_col, BLOCK_64X64);
|
||||
|
||||
if (xd->mb_to_right_edge < 0)
|
||||
@ -817,7 +829,8 @@ static void choose_partitioning(VP9_COMP *cpi,
|
||||
// we get to one that's got a variance lower than our threshold.
|
||||
if ( mi_col + 8 > cm->mi_cols || mi_row + 8 > cm->mi_rows ||
|
||||
!set_vt_partitioning(cpi, xd, &vt, BLOCK_64X64, mi_row, mi_col,
|
||||
cpi->vbp_threshold_bsize_max, BLOCK_16X16)) {
|
||||
cpi->vbp_threshold_bsize_max, BLOCK_16X16,
|
||||
segment_id)) {
|
||||
for (i = 0; i < 4; ++i) {
|
||||
const int x32_idx = ((i & 1) << 2);
|
||||
const int y32_idx = ((i >> 1) << 2);
|
||||
@ -825,7 +838,7 @@ static void choose_partitioning(VP9_COMP *cpi,
|
||||
if (!set_vt_partitioning(cpi, xd, &vt.split[i], BLOCK_32X32,
|
||||
(mi_row + y32_idx), (mi_col + x32_idx),
|
||||
cpi->vbp_threshold,
|
||||
BLOCK_16X16)) {
|
||||
BLOCK_16X16, segment_id)) {
|
||||
for (j = 0; j < 4; ++j) {
|
||||
const int x16_idx = ((j & 1) << 1);
|
||||
const int y16_idx = ((j >> 1) << 1);
|
||||
@ -839,7 +852,7 @@ static void choose_partitioning(VP9_COMP *cpi,
|
||||
mi_row + y32_idx + y16_idx,
|
||||
mi_col + x32_idx + x16_idx,
|
||||
cpi->vbp_threshold_16x16,
|
||||
cpi->vbp_bsize_min)) {
|
||||
cpi->vbp_bsize_min, segment_id)) {
|
||||
for (k = 0; k < 4; ++k) {
|
||||
const int x8_idx = (k & 1);
|
||||
const int y8_idx = (k >> 1);
|
||||
@ -849,7 +862,7 @@ static void choose_partitioning(VP9_COMP *cpi,
|
||||
mi_row + y32_idx + y16_idx + y8_idx,
|
||||
mi_col + x32_idx + x16_idx + x8_idx,
|
||||
cpi->vbp_threshold_bsize_min,
|
||||
BLOCK_8X8)) {
|
||||
BLOCK_8X8, segment_id)) {
|
||||
set_block_size(cpi, xd,
|
||||
(mi_row + y32_idx + y16_idx + y8_idx),
|
||||
(mi_col + x32_idx + x16_idx + x8_idx),
|
||||
|
@ -242,9 +242,13 @@ static void model_rd_for_sb_y(VP9_COMP *cpi, BLOCK_SIZE bsize,
|
||||
else
|
||||
xd->mi[0].src_mi->mbmi.tx_size = TX_8X8;
|
||||
|
||||
if (cpi->sf.partition_search_type == VAR_BASED_PARTITION &&
|
||||
xd->mi[0].src_mi->mbmi.tx_size > TX_16X16)
|
||||
xd->mi[0].src_mi->mbmi.tx_size = TX_16X16;
|
||||
if (cpi->sf.partition_search_type == VAR_BASED_PARTITION) {
|
||||
if (cpi->oxcf.aq_mode == CYCLIC_REFRESH_AQ &&
|
||||
xd->mi[0].src_mi->mbmi.segment_id != CR_SEGMENT_ID_BASE)
|
||||
xd->mi[0].src_mi->mbmi.tx_size = TX_8X8;
|
||||
else if (xd->mi[0].src_mi->mbmi.tx_size > TX_16X16)
|
||||
xd->mi[0].src_mi->mbmi.tx_size = TX_16X16;
|
||||
}
|
||||
} else {
|
||||
xd->mi[0].src_mi->mbmi.tx_size =
|
||||
MIN(max_txsize_lookup[bsize],
|
||||
|
Loading…
x
Reference in New Issue
Block a user