From 525dbe7093af25cfe993f0e16ace2ff3685e1aad Mon Sep 17 00:00:00 2001 From: Karina Date: Thu, 14 Apr 2016 10:06:57 +0800 Subject: [PATCH] add 32-bit parameter sign-extentions for block_add_aarch64_neon.S --- codec/decoder/core/arm64/block_add_aarch64_neon.S | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/codec/decoder/core/arm64/block_add_aarch64_neon.S b/codec/decoder/core/arm64/block_add_aarch64_neon.S index e2066d20..d6558ea2 100644 --- a/codec/decoder/core/arm64/block_add_aarch64_neon.S +++ b/codec/decoder/core/arm64/block_add_aarch64_neon.S @@ -68,7 +68,7 @@ // uint8_t *pred, const int32_t stride, int16_t *rs WELS_ASM_AARCH64_FUNC_BEGIN IdctResAddPred_AArch64_neon - + SIGN_EXTENSION x1,w1 ld4 {v0.4h, v1.4h, v2.4h, v3.4h}, [x2] // cost 3 cycles! ROW_TRANSFORM_1_STEP v0, v1, v2, v3, v16, v17, v18, v19, v4, v5 TRANSFORM_4BYTES v0, v1, v2, v3, v16, v17, v18, v19 @@ -113,6 +113,7 @@ WELS_ASM_AARCH64_FUNC_END WELS_ASM_AARCH64_FUNC_BEGIN WelsBlockZero16x16_AArch64_neon eor v0.16b, v0.16b, v0.16b eor v1.16b, v1.16b, v1.16b + SIGN_EXTENSION x1,w1 lsl x1, x1, 1 .rept 16 st1 {v0.16b, v1.16b}, [x0], x1