 5a92284167
			
		
	
	5a92284167
	
	
	
		
			
			Add following functions: bcopy, memcpy, memmove, memset, bzero, memcmp, wmemcmp, strlen, strcpy, strncpy, stpcpy, stpncpy. Create new directories inside arch-x86 to specify architecture: atom, silvermont and generic (non atom or silvermont architectures are treated like generic). Due to introducing optimized versions of stpcpy and stpncpy, c-implementations of these functions are moved from common for architectures makefile to arm and mips specific makefiles. Change-Id: I990f8061c3e9bca1f154119303da9e781c5d086e Signed-off-by: Varvara Rainchik <varvara.rainchik@intel.com>
		
			
				
	
	
		
			392 lines
		
	
	
		
			6.8 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
			
		
		
	
	
			392 lines
		
	
	
		
			6.8 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
| /*
 | |
| Copyright (c) 2011, Intel Corporation
 | |
| All rights reserved.
 | |
| 
 | |
| Redistribution and use in source and binary forms, with or without
 | |
| modification, are permitted provided that the following conditions are met:
 | |
| 
 | |
|     * Redistributions of source code must retain the above copyright notice,
 | |
|     * this list of conditions and the following disclaimer.
 | |
| 
 | |
|     * Redistributions in binary form must reproduce the above copyright notice,
 | |
|     * this list of conditions and the following disclaimer in the documentation
 | |
|     * and/or other materials provided with the distribution.
 | |
| 
 | |
|     * Neither the name of Intel Corporation nor the names of its contributors
 | |
|     * may be used to endorse or promote products derived from this software
 | |
|     * without specific prior written permission.
 | |
| 
 | |
| THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
 | |
| ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 | |
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 | |
| DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
 | |
| ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 | |
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 | |
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
 | |
| ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 | |
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 | |
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 | |
| */
 | |
| 
 | |
| #ifndef L
 | |
| # define L(label)	.L##label
 | |
| #endif
 | |
| 
 | |
| #ifndef cfi_startproc
 | |
| # define cfi_startproc	.cfi_startproc
 | |
| #endif
 | |
| 
 | |
| #ifndef cfi_endproc
 | |
| # define cfi_endproc	.cfi_endproc
 | |
| #endif
 | |
| 
 | |
| #ifndef cfi_rel_offset
 | |
| # define cfi_rel_offset(reg, off)	.cfi_rel_offset reg, off
 | |
| #endif
 | |
| 
 | |
| #ifndef cfi_restore
 | |
| # define cfi_restore(reg)	.cfi_restore reg
 | |
| #endif
 | |
| 
 | |
| #ifndef cfi_adjust_cfa_offset
 | |
| # define cfi_adjust_cfa_offset(off)	.cfi_adjust_cfa_offset off
 | |
| #endif
 | |
| 
 | |
| #ifndef ENTRY
 | |
| # define ENTRY(name)	\
 | |
| 	.type name,  @function;	\
 | |
| 	.globl name;	\
 | |
| 	.p2align 4;	\
 | |
| name:	\
 | |
| 	cfi_startproc
 | |
| #endif
 | |
| 
 | |
| #ifndef END
 | |
| # define END(name)	\
 | |
| 	cfi_endproc;	\
 | |
| 	.size name,	.-name
 | |
| #endif
 | |
| 
 | |
| #define CFI_PUSH(REG)	\
 | |
| 	cfi_adjust_cfa_offset (4);	\
 | |
| 	cfi_rel_offset (REG, 0)
 | |
| 
 | |
| #define CFI_POP(REG)	\
 | |
| 	cfi_adjust_cfa_offset (-4);	\
 | |
| 	cfi_restore (REG)
 | |
| 
 | |
| #define PUSH(REG)	pushl REG;	CFI_PUSH (REG)
 | |
| #define POP(REG)	popl REG;	CFI_POP (REG)
 | |
| 
 | |
| #define PARMS	8
 | |
| #define ENTRANCE	PUSH(%edi)
 | |
| #define RETURN	POP (%edi); ret; CFI_PUSH (%edi);
 | |
| 
 | |
| 
 | |
| #define STR1	PARMS
 | |
| #define STR2	STR1+4
 | |
| 
 | |
| 	.text
 | |
| ENTRY (strchr)
 | |
| 
 | |
| 	ENTRANCE
 | |
| 	mov	STR1(%esp), %ecx
 | |
| 	movd	STR2(%esp), %xmm1
 | |
| 
 | |
| 	pxor	%xmm2, %xmm2
 | |
| 	mov	%ecx, %edi
 | |
| 	punpcklbw %xmm1, %xmm1
 | |
| 	punpcklbw %xmm1, %xmm1
 | |
| 	/* ECX has OFFSET. */
 | |
| 	and	$15, %ecx
 | |
| 	pshufd	$0, %xmm1, %xmm1
 | |
| 	je	L(loop)
 | |
| 
 | |
| /* Handle unaligned string.  */
 | |
| 	and	$-16, %edi
 | |
| 	movdqa	(%edi), %xmm0
 | |
| 	pcmpeqb	%xmm0, %xmm2
 | |
| 	pcmpeqb	%xmm1, %xmm0
 | |
| 	/* Find where NULL is.  */
 | |
| 	pmovmskb %xmm2, %edx
 | |
| 	/* Check if there is a match.  */
 | |
| 	pmovmskb %xmm0, %eax
 | |
| 	/* Remove the leading bytes.  */
 | |
| 	sarl	%cl, %edx
 | |
| 	sarl	%cl, %eax
 | |
| 	test	%eax, %eax
 | |
| 	jz	L(unaligned_no_match)
 | |
| 	add	%ecx, %edi
 | |
| 	test	%edx, %edx
 | |
| 	jz	L(match_case1)
 | |
| 	jmp	L(match_case2)
 | |
| 
 | |
| 	.p2align 4
 | |
| L(unaligned_no_match):
 | |
| 	test	%edx, %edx
 | |
| 	jne	L(return_null)
 | |
| 
 | |
| 	pxor	%xmm2, %xmm2
 | |
| 	add	$16, %edi
 | |
| 
 | |
| 	.p2align 4
 | |
| /* Loop start on aligned string.  */
 | |
| L(loop):
 | |
| 	movdqa	(%edi), %xmm0
 | |
| 	pcmpeqb	%xmm0, %xmm2
 | |
| 	pcmpeqb	%xmm1, %xmm0
 | |
| 	pmovmskb %xmm2, %edx
 | |
| 	pmovmskb %xmm0, %eax
 | |
| 	test	%eax, %eax
 | |
| 	jnz	L(matches)
 | |
| 	test	%edx, %edx
 | |
| 	jnz	L(return_null)
 | |
| 	add	$16, %edi
 | |
| 
 | |
| 	movdqa	(%edi), %xmm0
 | |
| 	pcmpeqb	%xmm0, %xmm2
 | |
| 	pcmpeqb	%xmm1, %xmm0
 | |
| 	pmovmskb %xmm2, %edx
 | |
| 	pmovmskb %xmm0, %eax
 | |
| 	test	%eax, %eax
 | |
| 	jnz	L(matches)
 | |
| 	test	%edx, %edx
 | |
| 	jnz	L(return_null)
 | |
| 	add	$16, %edi
 | |
| 
 | |
| 	movdqa	(%edi), %xmm0
 | |
| 	pcmpeqb	%xmm0, %xmm2
 | |
| 	pcmpeqb	%xmm1, %xmm0
 | |
| 	pmovmskb %xmm2, %edx
 | |
| 	pmovmskb %xmm0, %eax
 | |
| 	test	%eax, %eax
 | |
| 	jnz	L(matches)
 | |
| 	test	%edx, %edx
 | |
| 	jnz	L(return_null)
 | |
| 	add	$16, %edi
 | |
| 
 | |
| 	movdqa	(%edi), %xmm0
 | |
| 	pcmpeqb	%xmm0, %xmm2
 | |
| 	pcmpeqb	%xmm1, %xmm0
 | |
| 	pmovmskb %xmm2, %edx
 | |
| 	pmovmskb %xmm0, %eax
 | |
| 	test	%eax, %eax
 | |
| 	jnz	L(matches)
 | |
| 	test	%edx, %edx
 | |
| 	jnz	L(return_null)
 | |
| 	add	$16, %edi
 | |
| 	jmp	L(loop)
 | |
| 
 | |
| L(matches):
 | |
| 	/* There is a match.  First find where NULL is.  */
 | |
| 	test	%edx, %edx
 | |
| 	jz	L(match_case1)
 | |
| 
 | |
| 	.p2align 4
 | |
| L(match_case2):
 | |
| 	test	%al, %al
 | |
| 	jz	L(match_higth_case2)
 | |
| 
 | |
| 	mov	%al, %cl
 | |
| 	and	$15, %cl
 | |
| 	jnz	L(match_case2_4)
 | |
| 
 | |
| 	mov	%dl, %ch
 | |
| 	and	$15, %ch
 | |
| 	jnz	L(return_null)
 | |
| 
 | |
| 	test	$0x10, %al
 | |
| 	jnz	L(Exit5)
 | |
| 	test	$0x10, %dl
 | |
| 	jnz	L(return_null)
 | |
| 	test	$0x20, %al
 | |
| 	jnz	L(Exit6)
 | |
| 	test	$0x20, %dl
 | |
| 	jnz	L(return_null)
 | |
| 	test	$0x40, %al
 | |
| 	jnz	L(Exit7)
 | |
| 	test	$0x40, %dl
 | |
| 	jnz	L(return_null)
 | |
| 	lea	7(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(match_case2_4):
 | |
| 	test	$0x01, %al
 | |
| 	jnz	L(Exit1)
 | |
| 	test	$0x01, %dl
 | |
| 	jnz	L(return_null)
 | |
| 	test	$0x02, %al
 | |
| 	jnz	L(Exit2)
 | |
| 	test	$0x02, %dl
 | |
| 	jnz	L(return_null)
 | |
| 	test	$0x04, %al
 | |
| 	jnz	L(Exit3)
 | |
| 	test	$0x04, %dl
 | |
| 	jnz	L(return_null)
 | |
| 	lea	3(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(match_higth_case2):
 | |
| 	test	%dl, %dl
 | |
| 	jnz	L(return_null)
 | |
| 
 | |
| 	mov	%ah, %cl
 | |
| 	and	$15, %cl
 | |
| 	jnz	L(match_case2_12)
 | |
| 
 | |
| 	mov	%dh, %ch
 | |
| 	and	$15, %ch
 | |
| 	jnz	L(return_null)
 | |
| 
 | |
| 	test	$0x10, %ah
 | |
| 	jnz	L(Exit13)
 | |
| 	test	$0x10, %dh
 | |
| 	jnz	L(return_null)
 | |
| 	test	$0x20, %ah
 | |
| 	jnz	L(Exit14)
 | |
| 	test	$0x20, %dh
 | |
| 	jnz	L(return_null)
 | |
| 	test	$0x40, %ah
 | |
| 	jnz	L(Exit15)
 | |
| 	test	$0x40, %dh
 | |
| 	jnz	L(return_null)
 | |
| 	lea	15(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(match_case2_12):
 | |
| 	test	$0x01, %ah
 | |
| 	jnz	L(Exit9)
 | |
| 	test	$0x01, %dh
 | |
| 	jnz	L(return_null)
 | |
| 	test	$0x02, %ah
 | |
| 	jnz	L(Exit10)
 | |
| 	test	$0x02, %dh
 | |
| 	jnz	L(return_null)
 | |
| 	test	$0x04, %ah
 | |
| 	jnz	L(Exit11)
 | |
| 	test	$0x04, %dh
 | |
| 	jnz	L(return_null)
 | |
| 	lea	11(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(match_case1):
 | |
| 	test	%al, %al
 | |
| 	jz	L(match_higth_case1)
 | |
| 
 | |
| 	test	$0x01, %al
 | |
| 	jnz	L(Exit1)
 | |
| 	test	$0x02, %al
 | |
| 	jnz	L(Exit2)
 | |
| 	test	$0x04, %al
 | |
| 	jnz	L(Exit3)
 | |
| 	test	$0x08, %al
 | |
| 	jnz	L(Exit4)
 | |
| 	test	$0x10, %al
 | |
| 	jnz	L(Exit5)
 | |
| 	test	$0x20, %al
 | |
| 	jnz	L(Exit6)
 | |
| 	test	$0x40, %al
 | |
| 	jnz	L(Exit7)
 | |
| 	lea	7(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(match_higth_case1):
 | |
| 	test	$0x01, %ah
 | |
| 	jnz	L(Exit9)
 | |
| 	test	$0x02, %ah
 | |
| 	jnz	L(Exit10)
 | |
| 	test	$0x04, %ah
 | |
| 	jnz	L(Exit11)
 | |
| 	test	$0x08, %ah
 | |
| 	jnz	L(Exit12)
 | |
| 	test	$0x10, %ah
 | |
| 	jnz	L(Exit13)
 | |
| 	test	$0x20, %ah
 | |
| 	jnz	L(Exit14)
 | |
| 	test	$0x40, %ah
 | |
| 	jnz	L(Exit15)
 | |
| 	lea	15(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit1):
 | |
| 	lea	(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit2):
 | |
| 	lea	1(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit3):
 | |
| 	lea	2(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit4):
 | |
| 	lea	3(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit5):
 | |
| 	lea	4(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit6):
 | |
| 	lea	5(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit7):
 | |
| 	lea	6(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit9):
 | |
| 	lea	8(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit10):
 | |
| 	lea	9(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit11):
 | |
| 	lea	10(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit12):
 | |
| 	lea	11(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit13):
 | |
| 	lea	12(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit14):
 | |
| 	lea	13(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(Exit15):
 | |
| 	lea	14(%edi), %eax
 | |
| 	RETURN
 | |
| 
 | |
| 	.p2align 4
 | |
| L(return_null):
 | |
| 	xor	%eax, %eax
 | |
| 	RETURN
 | |
| 
 | |
| END (strchr)
 |