|  | /* | 
|  | Copyright (c) 2011, Intel Corporation | 
|  | All rights reserved. | 
|  |  | 
|  | Redistribution and use in source and binary forms, with or without | 
|  | modification, are permitted provided that the following conditions are met: | 
|  |  | 
|  | * Redistributions of source code must retain the above copyright notice, | 
|  | * this list of conditions and the following disclaimer. | 
|  |  | 
|  | * Redistributions in binary form must reproduce the above copyright notice, | 
|  | * this list of conditions and the following disclaimer in the documentation | 
|  | * and/or other materials provided with the distribution. | 
|  |  | 
|  | * Neither the name of Intel Corporation nor the names of its contributors | 
|  | * may be used to endorse or promote products derived from this software | 
|  | * without specific prior written permission. | 
|  |  | 
|  | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND | 
|  | ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | 
|  | WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE | 
|  | DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR | 
|  | ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | 
|  | (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | 
|  | LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON | 
|  | ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | 
|  | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | 
|  | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | 
|  | */ | 
|  |  | 
|  | #ifndef L | 
|  | # define L(label)	.L##label | 
|  | #endif | 
|  |  | 
|  | #ifndef cfi_startproc | 
|  | # define cfi_startproc	.cfi_startproc | 
|  | #endif | 
|  |  | 
|  | #ifndef cfi_endproc | 
|  | # define cfi_endproc	.cfi_endproc | 
|  | #endif | 
|  |  | 
|  | #ifndef cfi_rel_offset | 
|  | # define cfi_rel_offset(reg, off)	.cfi_rel_offset reg, off | 
|  | #endif | 
|  |  | 
|  | #ifndef cfi_restore | 
|  | # define cfi_restore(reg)	.cfi_restore reg | 
|  | #endif | 
|  |  | 
|  | #ifndef cfi_adjust_cfa_offset | 
|  | # define cfi_adjust_cfa_offset(off)	.cfi_adjust_cfa_offset off | 
|  | #endif | 
|  |  | 
|  | #ifndef ENTRY | 
|  | # define ENTRY(name)	\ | 
|  | .type name,  @function;	\ | 
|  | .globl name;	\ | 
|  | .p2align 4;	\ | 
|  | name:	\ | 
|  | cfi_startproc | 
|  | #endif | 
|  |  | 
|  | #ifndef END | 
|  | # define END(name)	\ | 
|  | cfi_endproc;	\ | 
|  | .size name,	.-name | 
|  | #endif | 
|  |  | 
|  | #define CFI_PUSH(REG)	\ | 
|  | cfi_adjust_cfa_offset (4);	\ | 
|  | cfi_rel_offset (REG, 0) | 
|  |  | 
|  | #define CFI_POP(REG)	\ | 
|  | cfi_adjust_cfa_offset (-4);	\ | 
|  | cfi_restore (REG) | 
|  |  | 
|  | #define PUSH(REG)	pushl REG;	CFI_PUSH (REG) | 
|  | #define POP(REG)	popl REG;	CFI_POP (REG) | 
|  |  | 
|  | #define PARMS	8 | 
|  | #define ENTRANCE	PUSH(%edi) | 
|  | #define RETURN	POP (%edi); ret; CFI_PUSH (%edi); | 
|  |  | 
|  |  | 
|  | #define STR1	PARMS | 
|  | #define STR2	STR1+4 | 
|  |  | 
|  | .text | 
|  | ENTRY (strchr) | 
|  |  | 
|  | ENTRANCE | 
|  | mov	STR1(%esp), %ecx | 
|  | movd	STR2(%esp), %xmm1 | 
|  |  | 
|  | pxor	%xmm2, %xmm2 | 
|  | mov	%ecx, %edi | 
|  | punpcklbw %xmm1, %xmm1 | 
|  | punpcklbw %xmm1, %xmm1 | 
|  | /* ECX has OFFSET. */ | 
|  | and	$15, %ecx | 
|  | pshufd	$0, %xmm1, %xmm1 | 
|  | je	L(loop) | 
|  |  | 
|  | /* Handle unaligned string.  */ | 
|  | and	$-16, %edi | 
|  | movdqa	(%edi), %xmm0 | 
|  | pcmpeqb	%xmm0, %xmm2 | 
|  | pcmpeqb	%xmm1, %xmm0 | 
|  | /* Find where NULL is.  */ | 
|  | pmovmskb %xmm2, %edx | 
|  | /* Check if there is a match.  */ | 
|  | pmovmskb %xmm0, %eax | 
|  | /* Remove the leading bytes.  */ | 
|  | sarl	%cl, %edx | 
|  | sarl	%cl, %eax | 
|  | test	%eax, %eax | 
|  | jz	L(unaligned_no_match) | 
|  | add	%ecx, %edi | 
|  | test	%edx, %edx | 
|  | jz	L(match_case1) | 
|  | jmp	L(match_case2) | 
|  |  | 
|  | .p2align 4 | 
|  | L(unaligned_no_match): | 
|  | test	%edx, %edx | 
|  | jne	L(return_null) | 
|  |  | 
|  | pxor	%xmm2, %xmm2 | 
|  | add	$16, %edi | 
|  |  | 
|  | .p2align 4 | 
|  | /* Loop start on aligned string.  */ | 
|  | L(loop): | 
|  | movdqa	(%edi), %xmm0 | 
|  | pcmpeqb	%xmm0, %xmm2 | 
|  | pcmpeqb	%xmm1, %xmm0 | 
|  | pmovmskb %xmm2, %edx | 
|  | pmovmskb %xmm0, %eax | 
|  | test	%eax, %eax | 
|  | jnz	L(matches) | 
|  | test	%edx, %edx | 
|  | jnz	L(return_null) | 
|  | add	$16, %edi | 
|  |  | 
|  | movdqa	(%edi), %xmm0 | 
|  | pcmpeqb	%xmm0, %xmm2 | 
|  | pcmpeqb	%xmm1, %xmm0 | 
|  | pmovmskb %xmm2, %edx | 
|  | pmovmskb %xmm0, %eax | 
|  | test	%eax, %eax | 
|  | jnz	L(matches) | 
|  | test	%edx, %edx | 
|  | jnz	L(return_null) | 
|  | add	$16, %edi | 
|  |  | 
|  | movdqa	(%edi), %xmm0 | 
|  | pcmpeqb	%xmm0, %xmm2 | 
|  | pcmpeqb	%xmm1, %xmm0 | 
|  | pmovmskb %xmm2, %edx | 
|  | pmovmskb %xmm0, %eax | 
|  | test	%eax, %eax | 
|  | jnz	L(matches) | 
|  | test	%edx, %edx | 
|  | jnz	L(return_null) | 
|  | add	$16, %edi | 
|  |  | 
|  | movdqa	(%edi), %xmm0 | 
|  | pcmpeqb	%xmm0, %xmm2 | 
|  | pcmpeqb	%xmm1, %xmm0 | 
|  | pmovmskb %xmm2, %edx | 
|  | pmovmskb %xmm0, %eax | 
|  | test	%eax, %eax | 
|  | jnz	L(matches) | 
|  | test	%edx, %edx | 
|  | jnz	L(return_null) | 
|  | add	$16, %edi | 
|  | jmp	L(loop) | 
|  |  | 
|  | L(matches): | 
|  | /* There is a match.  First find where NULL is.  */ | 
|  | test	%edx, %edx | 
|  | jz	L(match_case1) | 
|  |  | 
|  | .p2align 4 | 
|  | L(match_case2): | 
|  | test	%al, %al | 
|  | jz	L(match_higth_case2) | 
|  |  | 
|  | mov	%al, %cl | 
|  | and	$15, %cl | 
|  | jnz	L(match_case2_4) | 
|  |  | 
|  | mov	%dl, %ch | 
|  | and	$15, %ch | 
|  | jnz	L(return_null) | 
|  |  | 
|  | test	$0x10, %al | 
|  | jnz	L(Exit5) | 
|  | test	$0x10, %dl | 
|  | jnz	L(return_null) | 
|  | test	$0x20, %al | 
|  | jnz	L(Exit6) | 
|  | test	$0x20, %dl | 
|  | jnz	L(return_null) | 
|  | test	$0x40, %al | 
|  | jnz	L(Exit7) | 
|  | test	$0x40, %dl | 
|  | jnz	L(return_null) | 
|  | lea	7(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(match_case2_4): | 
|  | test	$0x01, %al | 
|  | jnz	L(Exit1) | 
|  | test	$0x01, %dl | 
|  | jnz	L(return_null) | 
|  | test	$0x02, %al | 
|  | jnz	L(Exit2) | 
|  | test	$0x02, %dl | 
|  | jnz	L(return_null) | 
|  | test	$0x04, %al | 
|  | jnz	L(Exit3) | 
|  | test	$0x04, %dl | 
|  | jnz	L(return_null) | 
|  | lea	3(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(match_higth_case2): | 
|  | test	%dl, %dl | 
|  | jnz	L(return_null) | 
|  |  | 
|  | mov	%ah, %cl | 
|  | and	$15, %cl | 
|  | jnz	L(match_case2_12) | 
|  |  | 
|  | mov	%dh, %ch | 
|  | and	$15, %ch | 
|  | jnz	L(return_null) | 
|  |  | 
|  | test	$0x10, %ah | 
|  | jnz	L(Exit13) | 
|  | test	$0x10, %dh | 
|  | jnz	L(return_null) | 
|  | test	$0x20, %ah | 
|  | jnz	L(Exit14) | 
|  | test	$0x20, %dh | 
|  | jnz	L(return_null) | 
|  | test	$0x40, %ah | 
|  | jnz	L(Exit15) | 
|  | test	$0x40, %dh | 
|  | jnz	L(return_null) | 
|  | lea	15(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(match_case2_12): | 
|  | test	$0x01, %ah | 
|  | jnz	L(Exit9) | 
|  | test	$0x01, %dh | 
|  | jnz	L(return_null) | 
|  | test	$0x02, %ah | 
|  | jnz	L(Exit10) | 
|  | test	$0x02, %dh | 
|  | jnz	L(return_null) | 
|  | test	$0x04, %ah | 
|  | jnz	L(Exit11) | 
|  | test	$0x04, %dh | 
|  | jnz	L(return_null) | 
|  | lea	11(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(match_case1): | 
|  | test	%al, %al | 
|  | jz	L(match_higth_case1) | 
|  |  | 
|  | test	$0x01, %al | 
|  | jnz	L(Exit1) | 
|  | test	$0x02, %al | 
|  | jnz	L(Exit2) | 
|  | test	$0x04, %al | 
|  | jnz	L(Exit3) | 
|  | test	$0x08, %al | 
|  | jnz	L(Exit4) | 
|  | test	$0x10, %al | 
|  | jnz	L(Exit5) | 
|  | test	$0x20, %al | 
|  | jnz	L(Exit6) | 
|  | test	$0x40, %al | 
|  | jnz	L(Exit7) | 
|  | lea	7(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(match_higth_case1): | 
|  | test	$0x01, %ah | 
|  | jnz	L(Exit9) | 
|  | test	$0x02, %ah | 
|  | jnz	L(Exit10) | 
|  | test	$0x04, %ah | 
|  | jnz	L(Exit11) | 
|  | test	$0x08, %ah | 
|  | jnz	L(Exit12) | 
|  | test	$0x10, %ah | 
|  | jnz	L(Exit13) | 
|  | test	$0x20, %ah | 
|  | jnz	L(Exit14) | 
|  | test	$0x40, %ah | 
|  | jnz	L(Exit15) | 
|  | lea	15(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit1): | 
|  | lea	(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit2): | 
|  | lea	1(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit3): | 
|  | lea	2(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit4): | 
|  | lea	3(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit5): | 
|  | lea	4(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit6): | 
|  | lea	5(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit7): | 
|  | lea	6(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit9): | 
|  | lea	8(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit10): | 
|  | lea	9(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit11): | 
|  | lea	10(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit12): | 
|  | lea	11(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit13): | 
|  | lea	12(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit14): | 
|  | lea	13(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(Exit15): | 
|  | lea	14(%edi), %eax | 
|  | RETURN | 
|  |  | 
|  | .p2align 4 | 
|  | L(return_null): | 
|  | xor	%eax, %eax | 
|  | RETURN | 
|  |  | 
|  | END (strchr) |