56f5a9a060
Jeff Muizelaar posted some changes to the idct/reconstruction c code. This is the equivalent update for the arm assembly. This shows a good boost on v6, and a minor boost on neon. Here are some numbers for highway in qcif, 2641 frames: HEAD neon: ~161 fps new neon: ~162 fps HEAD v6: ~102 fps new v6: ~106 fps The following functions have been updated for armv6 and neon: vp8_dc_only_idct_add vp8_dequant_idct_add vp8_dequant_dc_idct_add Conflicts: vp8/decoder/arm/armv6/dequantdcidct_v6.asm vp8/decoder/arm/armv6/dequantidct_v6.asm Resolved by removing these files. When I rewrote the functions, I also moved the files to dequant_dc_idct_v6.asm/dequant_idct_v6.asm Change-Id: Ie3300df824d52474eca1a5134cf22d8b7809a5d4
62 lines
1.8 KiB
C
62 lines
1.8 KiB
C
/*
 * Copyright (c) 2010 The VP8 project authors. All Rights Reserved.
 *
 * Use of this source code is governed by a BSD-style license
 * that can be found in the LICENSE file in the root of the source
 * tree. An additional intellectual property rights grant can be found
 * in the file PATENTS. All contributing project authors may
 * be found in the AUTHORS file in the root of the source tree.
 */


#ifndef IDCT_ARM_H
#define IDCT_ARM_H

/*
 * ARM-specific bindings for the inverse-transform entry points.
 *
 * Each section below is active when its feature macro evaluates to non-zero.
 * An active section declares the routines for that ARM variant and then
 * redirects the generic vp8_idct_* names to them with #undef / #define.
 *
 * The prototype_idct, prototype_idct_scalar_add and prototype_second_order
 * macros are NOT defined in this header; they must already be visible at the
 * point of inclusion.
 * NOTE(review): presumably they come from the generic idct header that
 * includes this file -- confirm against the includer.
 *
 * Section order matters: the ARMv7 section comes last, so when both
 * HAVE_ARMV6 and HAVE_ARMV7 are non-zero its #undef / #define pairs replace
 * the ARMv6 bindings made just above.
 */

#if HAVE_ARMV6
/* Declarations of the ARMv6 (_v6) routines. */
extern prototype_idct(vp8_short_idct4x4llm_1_v6);
extern prototype_idct(vp8_short_idct4x4llm_v6_dual);
extern prototype_idct_scalar_add(vp8_dc_only_idct_add_v6);
extern prototype_second_order(vp8_short_inv_walsh4x4_1_v6);
extern prototype_second_order(vp8_short_inv_walsh4x4_v6);

/* Drop any earlier binding of each generic name, then bind it to _v6. */
#undef vp8_idct_idct1
#define vp8_idct_idct1 vp8_short_idct4x4llm_1_v6

#undef vp8_idct_idct16
#define vp8_idct_idct16 vp8_short_idct4x4llm_v6_dual

#undef vp8_idct_idct1_scalar_add
#define vp8_idct_idct1_scalar_add vp8_dc_only_idct_add_v6

#undef vp8_idct_iwalsh1
#define vp8_idct_iwalsh1 vp8_short_inv_walsh4x4_1_v6

#undef vp8_idct_iwalsh16
#define vp8_idct_iwalsh16 vp8_short_inv_walsh4x4_v6
#endif /* HAVE_ARMV6 */

#if HAVE_ARMV7
/* Declarations of the ARMv7 (_neon) routines. */
extern prototype_idct(vp8_short_idct4x4llm_1_neon);
extern prototype_idct(vp8_short_idct4x4llm_neon);
extern prototype_idct_scalar_add(vp8_dc_only_idct_add_neon);
extern prototype_second_order(vp8_short_inv_walsh4x4_1_neon);
extern prototype_second_order(vp8_short_inv_walsh4x4_neon);

/*
 * Drop any earlier binding of each generic name (including the ARMv6 one
 * from the section above, if it was active), then bind it to _neon.
 */
#undef vp8_idct_idct1
#define vp8_idct_idct1 vp8_short_idct4x4llm_1_neon

#undef vp8_idct_idct16
#define vp8_idct_idct16 vp8_short_idct4x4llm_neon

#undef vp8_idct_idct1_scalar_add
#define vp8_idct_idct1_scalar_add vp8_dc_only_idct_add_neon

#undef vp8_idct_iwalsh1
#define vp8_idct_iwalsh1 vp8_short_inv_walsh4x4_1_neon

#undef vp8_idct_iwalsh16
#define vp8_idct_iwalsh16 vp8_short_inv_walsh4x4_neon
#endif /* HAVE_ARMV7 */

#endif /* IDCT_ARM_H */