From 6b2bedfe2810c6c5dd9b3481fe5ab9e9348387a9 Mon Sep 17 00:00:00 2001 From: Roy Oursler Date: Tue, 26 Jul 2016 11:08:30 -0700 Subject: [PATCH] igzip: Fix to run on SSE Signed-off-by: Roy Oursler Reviewed-by: Greg Tucker --- igzip/igzip_decode_block_stateless.asm | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/igzip/igzip_decode_block_stateless.asm b/igzip/igzip_decode_block_stateless.asm index b00bab7..38c5cec 100644 --- a/igzip/igzip_decode_block_stateless.asm +++ b/igzip/igzip_decode_block_stateless.asm @@ -398,7 +398,7 @@ decode_len_dist: ;; ;; Check if a valid look back distances was decoded cmp copy_start, [rsp + start_out_mem_offset] jl invalid_look_back_distance - vmovdqu xmm1, [copy_start] + MOVDQU xmm1, [copy_start] ;; Set tmp2 to be the minimum of COPY_SIZE and repeat_length ;; This is to decrease use of small_byte_copy branch @@ -412,23 +412,23 @@ decode_len_dist: large_byte_copy: ;; Copy length distance pair when memory overlap is not an issue - vmovdqu [copy_start + look_back_dist2], xmm1 + MOVDQU [copy_start + look_back_dist2], xmm1 sub repeat_length, COPY_SIZE jle loop_block add copy_start, COPY_SIZE - vmovdqu xmm1, [copy_start] + MOVDQU xmm1, [copy_start] jmp large_byte_copy small_byte_copy_pre: ;; Copy length distance pair when source and destination overlap add repeat_length, look_back_dist2 small_byte_copy: - vmovdqu [copy_start + look_back_dist2], xmm1 + MOVDQU [copy_start + look_back_dist2], xmm1 shl look_back_dist2, 1 - vmovdqu xmm1, [copy_start] + MOVDQU xmm1, [copy_start] cmp look_back_dist2, COPY_SIZE jl small_byte_copy