x86/hevc_mc: use aligned loads
Signed-off-by: Michael Niedermayer <michaelni@gmx.at>
This commit is contained in:
parent
383fddeec6
commit
6ecc3fd612
@ -771,7 +771,7 @@ typedef struct HEVCLocalContext {
|
|||||||
DECLARE_ALIGNED(32, uint8_t, edge_emu_buffer)[(MAX_PB_SIZE + 7) * EDGE_EMU_BUFFER_STRIDE * 2];
|
DECLARE_ALIGNED(32, uint8_t, edge_emu_buffer)[(MAX_PB_SIZE + 7) * EDGE_EMU_BUFFER_STRIDE * 2];
|
||||||
/* The extended size between the new edge emu buffer is abused by SAO */
|
/* The extended size between the new edge emu buffer is abused by SAO */
|
||||||
DECLARE_ALIGNED(32, uint8_t, edge_emu_buffer2)[(MAX_PB_SIZE + 7) * EDGE_EMU_BUFFER_STRIDE * 2];
|
DECLARE_ALIGNED(32, uint8_t, edge_emu_buffer2)[(MAX_PB_SIZE + 7) * EDGE_EMU_BUFFER_STRIDE * 2];
|
||||||
DECLARE_ALIGNED(16, int16_t, tmp [MAX_PB_SIZE * MAX_PB_SIZE]);
|
DECLARE_ALIGNED(32, int16_t, tmp [MAX_PB_SIZE * MAX_PB_SIZE]);
|
||||||
|
|
||||||
int ct_depth;
|
int ct_depth;
|
||||||
CodingUnit cu;
|
CodingUnit cu;
|
||||||
|
@ -103,14 +103,14 @@ QPEL_TABLE 10, 8, w, avx2
|
|||||||
%endif ;avx
|
%endif ;avx
|
||||||
%elif %1 <= 16
|
%elif %1 <= 16
|
||||||
%if cpuflag(avx2)
|
%if cpuflag(avx2)
|
||||||
movu %3, [%2]
|
mova %3, [%2]
|
||||||
%else
|
%else
|
||||||
movdqa %3, [%2] ; load data from source2
|
movdqa %3, [%2] ; load data from source2
|
||||||
movdqa %4, [%2+16] ; load data from source2
|
movdqa %4, [%2+16] ; load data from source2
|
||||||
%endif ; avx
|
%endif ; avx
|
||||||
%else ; %1 = 32
|
%else ; %1 = 32
|
||||||
movu %3, [%2]
|
mova %3, [%2]
|
||||||
movu %4, [%2+32]
|
mova %4, [%2+32]
|
||||||
%endif
|
%endif
|
||||||
%endmacro
|
%endmacro
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user