705f5e5e15
~25% faster DTS decoding overall. The checkasm CPU cycle counts are not that useful, since synth_filter_float() calls FFTContext.imdct_half(). Cycle counts (cortex-a57 / cortex-a53): synth_filter_float_c: 1866.2 / 3490.9; synth_filter_float_neon: 915.0 / 1531.5. With fftc.imdct_half forced to imdct_half_neon (cortex-a57 / cortex-a53): synth_filter_float_c: 1718.4 / 3025.3; synth_filter_float_neon: 926.2 / 1530.1.
34 lines
1.3 KiB
C
34 lines
1.3 KiB
C
/*
|
|
* This file is part of Libav.
|
|
*
|
|
* Libav is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* Libav is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with Libav; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
#ifndef AVCODEC_AARCH64_ASM_OFFSETS_H
|
|
#define AVCODEC_AARCH64_ASM_OFFSETS_H
|
|
|
|
/*
 * CeltIMDCTContext
 *
 * Hard-coded numeric offsets, one macro per value.
 * NOTE(review): presumably these are byte offsets of CeltIMDCTContext
 * members for use from AArch64 assembly (going by the include guard name);
 * confirm against the struct definition, which is not visible here.
 * Nothing in this header checks the values against the C struct, so they
 * have to be kept in sync by hand.
 */
|
|
#define CELT_EXPTAB 0x20
|
|
#define CELT_FFT_N 0x00
|
|
#define CELT_LEN2 0x04
|
|
/* Expressed relative to CELT_LEN2 (evaluates to 0x08) so the two offsets
 * stay 4 bytes apart; the pair is meant to be fetched together. */
#define CELT_LEN4 (CELT_LEN2 + 0x4) // loaded as pair
|
|
#define CELT_TMP 0x10
|
|
/* Expressed relative to CELT_TMP (evaluates to 0x18) so the two offsets
 * stay 8 bytes apart; the pair is meant to be fetched together. */
#define CELT_TWIDDLE (CELT_TMP + 0x8) // loaded as pair
|
|
|
|
/*
 * FFTContext
 *
 * NOTE(review): presumably the byte offset of the imdct_half member within
 * FFTContext, for use from AArch64 assembly; confirm against the struct
 * definition, which is not visible here. Nothing in this header checks the
 * value against the C struct, so it has to be kept in sync by hand.
 */
|
|
#define IMDCT_HALF 0x48
|
|
|
|
#endif /* AVCODEC_AARCH64_ASM_OFFSETS_H */
|