x86/hevc_sao: use unaligned movs for sao_{band,filter} with width 8
Suggested-by: Christophe Gisquet <christophe.gisquet@gmail.com>
Reviewed-by: Michael Niedermayer <michaelni@gmx.at>
Signed-off-by: James Almer <jamrial@gmail.com>
This commit is contained in:
parent
88ec5435bb
commit
5c8f747085
@ -193,10 +193,10 @@ cglobal hevc_sao_band_filter_%2_%1, 6, 6, 15, 7*mmsize*ARCH_X86_32, dst, src, ds
|
|||||||
align 16
|
align 16
|
||||||
.loop
|
.loop
|
||||||
%if %2 == 8
|
%if %2 == 8
|
||||||
mova m8, [srcq]
|
movu m8, [srcq]
|
||||||
HEVC_SAO_BAND_FILTER_COMPUTE %1, m9, m8
|
HEVC_SAO_BAND_FILTER_COMPUTE %1, m9, m8
|
||||||
CLIPW m8, m14, m13
|
CLIPW m8, m14, m13
|
||||||
mova [dstq], m8
|
movu [dstq], m8
|
||||||
%endif
|
%endif
|
||||||
|
|
||||||
%assign i 0
|
%assign i 0
|
||||||
@ -537,7 +537,7 @@ align 16
|
|||||||
|
|
||||||
HEVC_SAO_EDGE_FILTER_COMPUTE_10
|
HEVC_SAO_EDGE_FILTER_COMPUTE_10
|
||||||
CLIPW m2, m0, [pw_mask %+ %1]
|
CLIPW m2, m0, [pw_mask %+ %1]
|
||||||
mova [dstq], m2
|
movu [dstq], m2
|
||||||
%endif
|
%endif
|
||||||
|
|
||||||
%assign i 0
|
%assign i 0
|
||||||
|
Loading…
Reference in New Issue
Block a user