cd907b1601
Rebased. This patch includes a 16x16 butterfly inverse ADST/DCT hybrid transform. It uses the ADST variant with kernel sin((2k+1)*(2n+1)/4N), which allows a butterfly implementation. The coding gains compared to DCT 16x16 are about 0.1% for both derf and std-hd. It is noteworthy that in the std-hd set many sequences gain about 0.5%, and some 0.2%. There are also a few points that show -1% to -3% performance. Hence the average comes to about 0.1%. Change-Id: Ie80ac84cf403390f6e5d282caa58723739e5ec17
145 lines
4.3 KiB
C
145 lines
4.3 KiB
C
/*
|
|
* Copyright (c) 2010 The WebM project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#include "vp9/common/vp9_invtrans.h"
|
|
#include "./vp9_rtcd.h"
|
|
|
|
/*
 * Inverse-transforms a single 4x4 block of the macroblock.
 *
 * The block's dqcoeff buffer is the input and its diff buffer is the output.
 * The work is delegated to one of two function pointers stored in xd,
 * selected by the block's eob value.
 *
 * xd    - macroblock descriptor holding the block array and the hooks.
 * block - index into xd->block.
 * pitch - forwarded unchanged to the selected hook.
 */
void vp9_inverse_transform_b_4x4(MACROBLOCKD *xd, int block, int pitch) {
  BLOCKD *const blk = &xd->block[block];

  if (blk->eob > 1) {
    xd->inv_txm4x4(blk->dqcoeff, blk->diff, pitch);
    return;
  }

  /* eob <= 1: presumably at most a DC coefficient is present, so the
   * "_1" variant is used -- TODO confirm against the hook definitions. */
  xd->inv_txm4x4_1(blk->dqcoeff, blk->diff, pitch);
}
|
|
|
|
/*
 * Inverse-transforms blocks 0..15 of the macroblock with 4x4 transforms,
 * using a pitch of 32.
 *
 * For each block the transform type is queried with get_tx_type_4x4().
 * DCT_DCT blocks go through vp9_inverse_transform_b_4x4(); every other type
 * goes through the hybrid transform, which is vp9_short_iht4x4() when
 * CONFIG_INTHT4X4 is set and vp9_ihtllm() otherwise.
 */
void vp9_inverse_transform_mby_4x4(MACROBLOCKD *xd) {
  int idx;

  for (idx = 0; idx < 16; ++idx) {
    BLOCKD *const blk = &xd->block[idx];
    const TX_TYPE tx_type = get_tx_type_4x4(xd, blk);

    if (tx_type == DCT_DCT) {
      vp9_inverse_transform_b_4x4(xd, idx, 32);
      continue;
    }

#if CONFIG_INTHT4X4
    vp9_short_iht4x4(blk->dqcoeff, blk->diff, 32, tx_type);
#else
    vp9_ihtllm(blk->dqcoeff, blk->diff, 32, tx_type, 4, blk->eob);
#endif
  }
}
|
|
|
|
/*
 * Inverse-transforms blocks 16..23 of the macroblock (presumably the chroma
 * blocks, judging by the "uv" in the name) with the 4x4 transform, using a
 * pitch of 16.
 */
void vp9_inverse_transform_mbuv_4x4(MACROBLOCKD *xd) {
  int blk_idx = 16;

  while (blk_idx < 24) {
    vp9_inverse_transform_b_4x4(xd, blk_idx, 16);
    ++blk_idx;
  }
}
|
|
|
|
/*
 * Runs the 4x4 inverse transform over the whole macroblock: first
 * vp9_inverse_transform_mby_4x4() (blocks 0..15), then
 * vp9_inverse_transform_mbuv_4x4() (blocks 16..23).
 */
void vp9_inverse_transform_mb_4x4(MACROBLOCKD *xd) {
  vp9_inverse_transform_mby_4x4(xd);
  vp9_inverse_transform_mbuv_4x4(xd);
}
|
|
|
|
/*
 * Inverse-transforms one 8x8 block by forwarding all three arguments,
 * unchanged and in the same order, to vp9_short_idct8x8().
 *
 * input_dqcoeff - source coefficients.
 * output_coeff  - destination buffer.
 * pitch         - pitch value handed to the IDCT routine.
 */
void vp9_inverse_transform_b_8x8(int16_t *input_dqcoeff, int16_t *output_coeff,
                                 int pitch) {
  vp9_short_idct8x8(input_dqcoeff, output_coeff, pitch);
}
|
|
|
|
/*
 * Inverse-transforms one 8x8 region, reading coefficients (and eob) from
 * xd->block[coeff_idx] and writing the result to xd->block[diff_idx].diff.
 * The transform type is looked up on the destination block. Pitch is 32.
 */
static void inverse_transform_y_8x8(MACROBLOCKD *xd, int coeff_idx,
                                    int diff_idx) {
  BLOCKD *const src = &xd->block[coeff_idx];
  BLOCKD *const dst = &xd->block[diff_idx];
  const TX_TYPE tx_type = get_tx_type_8x8(xd, dst);

  if (tx_type == DCT_DCT) {
    vp9_inverse_transform_b_8x8(&src->dqcoeff[0], &dst->diff[0], 32);
    return;
  }

#if CONFIG_INTHT
  vp9_short_iht8x8(src->dqcoeff, dst->diff, 32, tx_type);
#else
  vp9_ihtllm(src->dqcoeff, dst->diff, 32, tx_type, 8, src->eob);
#endif
}

/*
 * Inverse-transforms the macroblock with four 8x8 transforms.
 *
 * The first pass handles blocks 0 and 8, where coefficients and output share
 * the same block index. The second pass writes to blocks 2 and 10 but reads
 * its coefficients from blocks 4 and 12 (index + 2). Processing order is
 * 0, 8, 2, 10.
 */
void vp9_inverse_transform_mby_8x8(MACROBLOCKD *xd) {
  int idx;

  /* Coefficient block and destination block coincide. */
  for (idx = 0; idx <= 8; idx += 8) {
    inverse_transform_y_8x8(xd, idx, idx);
  }

  /* Coefficients live two blocks after the destination block. */
  for (idx = 2; idx <= 10; idx += 8) {
    inverse_transform_y_8x8(xd, idx + 2, idx);
  }
}
|
|
|
|
/*
 * Applies the 8x8 inverse transform to blocks 16 and 20 of the macroblock
 * (presumably one per chroma plane, judging by the "uv" in the name), using
 * a pitch of 16.
 */
void vp9_inverse_transform_mbuv_8x8(MACROBLOCKD *xd) {
  BLOCKD *const blocks = xd->block;
  int idx = 16;

  while (idx < 24) {
    BLOCKD *const blk = &blocks[idx];
    vp9_inverse_transform_b_8x8(&blk->dqcoeff[0], &blk->diff[0], 16);
    idx += 4;
  }
}
|
|
|
|
/*
 * Runs the 8x8 inverse transform over the whole macroblock: first
 * vp9_inverse_transform_mby_8x8(), then vp9_inverse_transform_mbuv_8x8().
 */
void vp9_inverse_transform_mb_8x8(MACROBLOCKD *xd) {
  vp9_inverse_transform_mby_8x8(xd);
  vp9_inverse_transform_mbuv_8x8(xd);
}
|
|
|
|
/*
 * Inverse-transforms one 16x16 block by forwarding all three arguments,
 * unchanged and in the same order, to vp9_short_idct16x16().
 *
 * input_dqcoeff - source coefficients.
 * output_coeff  - destination buffer.
 * pitch         - pitch value handed to the IDCT routine.
 */
void vp9_inverse_transform_b_16x16(int16_t *input_dqcoeff,
                                   int16_t *output_coeff, int pitch) {
  vp9_short_idct16x16(input_dqcoeff, output_coeff, pitch);
}
|
|
|
|
/*
 * Inverse-transforms the macroblock with a single 16x16 transform, reading
 * dqcoeff and writing diff of block 0 with a pitch of 32.
 *
 * The transform type comes from get_tx_type_16x16(). DCT_DCT uses
 * vp9_inverse_transform_b_16x16(); any other type uses vp9_short_iht16x16()
 * when CONFIG_INTHT16X16 is set and vp9_ihtllm() otherwise.
 */
void vp9_inverse_transform_mby_16x16(MACROBLOCKD *xd) {
  BLOCKD *const blk = &xd->block[0];
  const TX_TYPE tx_type = get_tx_type_16x16(xd, blk);

  if (tx_type == DCT_DCT) {
    vp9_inverse_transform_b_16x16(&blk->dqcoeff[0], &blk->diff[0], 32);
    return;
  }

#if CONFIG_INTHT16X16
  vp9_short_iht16x16(blk->dqcoeff, blk->diff, 32, tx_type);
#else
  vp9_ihtllm(blk->dqcoeff, blk->diff, 32, tx_type, 16, blk->eob);
#endif
}
|
|
|
|
/*
 * Inverse-transforms the whole macroblock when the 16x16 transform is in
 * use: vp9_inverse_transform_mby_16x16() first, followed by the 8x8 routine
 * vp9_inverse_transform_mbuv_8x8().
 */
void vp9_inverse_transform_mb_16x16(MACROBLOCKD *xd) {
  vp9_inverse_transform_mby_16x16(xd);
  vp9_inverse_transform_mbuv_8x8(xd);
}
|
|
|
|
/*
 * Runs vp9_short_idct32x32() from the start of the superblock's dqcoeff
 * buffer into the start of its diff buffer, with a pitch of 64.
 */
void vp9_inverse_transform_sby_32x32(SUPERBLOCKD *xd_sb) {
  const int pitch = 64;

  vp9_short_idct32x32(xd_sb->dqcoeff, xd_sb->diff, pitch);
}
|
|
|
|
/*
 * Applies the 16x16 inverse transform twice within the superblock buffers:
 * once at element offset 1024 and once at offset 1280 (256 further on),
 * each with a pitch of 32. The same offset is used for dqcoeff and diff.
 * Presumably these are the two chroma planes stored after the luma data
 * -- TODO confirm against the SUPERBLOCKD layout.
 */
void vp9_inverse_transform_sbuv_16x16(SUPERBLOCKD *xd_sb) {
  int offset;

  for (offset = 1024; offset <= 1280; offset += 256) {
    vp9_inverse_transform_b_16x16(xd_sb->dqcoeff + offset,
                                  xd_sb->diff + offset, 32);
  }
}
|