Merge "Speed up h_predictor_4x4"

This commit is contained in:
James Zern
2015-11-21 01:12:42 +00:00
committed by Gerrit Code Review

View File

@@ -33,23 +33,20 @@ sh_b2333: db 2, 3, 3, 3, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0
SECTION .text SECTION .text
INIT_MMX ssse3 INIT_XMM ssse3
cglobal h_predictor_4x4, 2, 4, 3, dst, stride, line, left cglobal h_predictor_4x4, 2, 4, 3, dst, stride, line, left
movifnidn leftq, leftmp movd m0, [leftq]
add leftq, 4 punpcklbw m0, m0
mov lineq, -2 punpcklbw m0, m0
pxor m0, m0 movd [dstq ], m0
.loop: psrldq m0, 4
movd m1, [leftq+lineq*2 ] movd [dstq+strideq], m0
movd m2, [leftq+lineq*2+1]
pshufb m1, m0
pshufb m2, m0
movd [dstq ], m1
movd [dstq+strideq], m2
lea dstq, [dstq+strideq*2] lea dstq, [dstq+strideq*2]
inc lineq psrldq m0, 4
jnz .loop movd [dstq ], m0
REP_RET psrldq m0, 4
movd [dstq+strideq], m0
RET
INIT_MMX ssse3 INIT_MMX ssse3
cglobal h_predictor_8x8, 2, 4, 3, dst, stride, line, left cglobal h_predictor_8x8, 2, 4, 3, dst, stride, line, left