/* Source path: sysdeps/x86_64/multiarch/strchr-sse2-no-bsf.S  */

/* strchr with SSE2 without bsf
   Copyright (C) 2011-2018 Free Software Foundation, Inc.
   Contributed by Intel Corporation.
   This file is part of the GNU C Library.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, see
   <http://www.gnu.org/licenses/>.  */

#if IS_IN (libc)

# include <sysdep.h>
# include "asm-syntax.h"

/* __strchr_sse2_no_bsf: find the first byte equal to C in a
   NUL-terminated string, using SSE2 byte compares and no bit-scan
   instruction.

   In:    %rdi = S, the start of the string
	  %esi = C; only its low byte is compared
   Out:   %rax = address of the first byte equal to C, or 0 when the
	  NUL terminator comes first.  Each position is tested for a
	  match before it is tested for NUL, so C == 0 yields the
	  address of the terminator.
   Clobbers: %rcx, %rdx, %rsi, %rdi, %xmm0-%xmm3, flags.
   The register usage matches the System V AMD64 argument/return
   convention; no stack is used.

   The string is read in aligned 16-byte chunks with movdqa.  The
   first chunk starts at S rounded down to a 16-byte boundary, so up
   to 15 bytes in front of S are loaded; their mask bits are cleared
   before the masks are examined.

   For each chunk, %eax holds the pmovmskb mask of bytes equal to C
   and %edx the mask of NUL bytes (bit i <=> byte i of the chunk).
   The lowest set bit is located with test/jnz chains instead of bsf.
   L(ExitN) returns the address of byte N-1 of the chunk; bytes 7 and
   15 are returned inline by the fall-through paths, so there is no
   L(Exit8) or L(Exit16).  */

	/* Section macro defined outside this file; presumably selects
	   the text section used for Atom-tuned code.  */
	atom_text_section
ENTRY (__strchr_sse2_no_bsf)
	movd	%esi, %xmm1		/* Low dword of %xmm1 = C.  */
	movq	%rdi, %rcx		/* Keep the unaligned S.  */
	punpcklbw %xmm1, %xmm1		/* Low byte of C now in bytes 0-1.  */
	andq	$~15, %rdi		/* Round S down to 16 bytes.  */
	pxor	%xmm2, %xmm2		/* %xmm2 = 0, for the NUL compare.  */
	punpcklbw %xmm1, %xmm1		/* Low byte of C now in bytes 0-3.  */
	orl	$0xffffffff, %esi	/* %esi = all ones (mask seed).  */
	movdqa	(%rdi), %xmm0		/* First aligned chunk.  */
	pshufd	$0, %xmm1, %xmm1	/* All 16 bytes of %xmm1 = C.  */
	subq	%rdi, %rcx		/* %rcx = S - aligned S (0..15).  */
	movdqa	%xmm0, %xmm3
	leaq	16(%rdi), %rdi		/* %rdi = next chunk.  */
	pcmpeqb	%xmm1, %xmm0		/* 0xff where byte == C.  */
	pcmpeqb	%xmm2, %xmm3		/* 0xff where byte == 0.  */
	shl	%cl, %esi		/* Clear bits of bytes before S.  */
	pmovmskb %xmm0, %eax		/* Match mask.  */
	pmovmskb %xmm3, %edx		/* NUL mask.  */
	andl	%esi, %eax		/* Ignore bytes in front of S.  */
	andl	%esi, %edx
	test	%eax, %eax
	jnz	L(matches)
	test	%edx, %edx
	jnz	L(return_null)		/* NUL seen, no match.  */

	/* Main loop.  %rdi is advanced before the masks are tested, so
	   on exit it points one chunk past the chunk just examined.  */
L(loop):
	movdqa	(%rdi), %xmm0
	leaq	16(%rdi), %rdi
	movdqa	%xmm0, %xmm3
	pcmpeqb	%xmm1, %xmm0
	pcmpeqb	%xmm2, %xmm3
	pmovmskb %xmm0, %eax
	pmovmskb %xmm3, %edx
	or	%eax, %edx		/* Any match or NUL in this chunk?  */
	jz	L(loop)

	/* The or above overwrote %edx; rebuild the NUL mask.  */
	pmovmskb %xmm3, %edx
	test	%eax, %eax
	jnz	L(matches)
	/* No match, so the chunk holds a NUL: fall through (across the
	   alignment padding) to L(return_null).  */

/* Return NULL.  */
	.p2align 4
L(return_null):
	/* A 32-bit xor zero-extends, so all of %rax becomes 0.  */
	xor	%eax, %eax
	ret

L(matches):
	/* There is a match.  First find where NULL is.  */
	leaq	-16(%rdi), %rdi		/* Back to the chunk with the match.  */
	test	%edx, %edx
	jz	L(match_case1)		/* No NUL in this chunk.  */

	/* Case 2: the chunk holds both a match and a NUL.  Walk the
	   bytes in order, testing the match bit before the NUL bit.  */
	.p2align 4
L(match_case2):
	test	%al, %al
	jz	L(match_high_case2)	/* No match in bytes 0-7.  */

	mov	%al, %cl
	and	$15, %cl
	jnz	L(match_case2_4)	/* Match in bytes 0-3.  */

	/* First match is in bytes 4-7; a NUL in bytes 0-3 precedes it.  */
	mov	%dl, %ch
	and	$15, %ch
	jnz	L(return_null)

	test	$0x10, %al
	jnz	L(Exit5)
	test	$0x10, %dl
	jnz	L(return_null)
	test	$0x20, %al
	jnz	L(Exit6)
	test	$0x20, %dl
	jnz	L(return_null)
	test	$0x40, %al
	jnz	L(Exit7)
	test	$0x40, %dl
	jnz	L(return_null)
	/* Only bit 7 of %al can still be set: the match is byte 7.  */
	lea	7(%rdi), %rax
	ret

	/* Match somewhere in bytes 0-3.  */
	.p2align 4
L(match_case2_4):
	test	$0x01, %al
	jnz	L(Exit1)
	test	$0x01, %dl
	jnz	L(return_null)
	test	$0x02, %al
	jnz	L(Exit2)
	test	$0x02, %dl
	jnz	L(return_null)
	test	$0x04, %al
	jnz	L(Exit3)
	test	$0x04, %dl
	jnz	L(return_null)
	/* Only bit 3 of %al can still be set: the match is byte 3.  */
	lea	3(%rdi), %rax
	ret

	/* No match in bytes 0-7; the match is in bytes 8-15.  */
	.p2align 4
L(match_high_case2):
	test	%dl, %dl
	jnz	L(return_null)		/* NUL in bytes 0-7 comes first.  */

	mov	%ah, %cl
	and	$15, %cl
	jnz	L(match_case2_12)	/* Match in bytes 8-11.  */

	/* First match is in bytes 12-15; a NUL in bytes 8-11 precedes it.  */
	mov	%dh, %ch
	and	$15, %ch
	jnz	L(return_null)

	test	$0x10, %ah
	jnz	L(Exit13)
	test	$0x10, %dh
	jnz	L(return_null)
	test	$0x20, %ah
	jnz	L(Exit14)
	test	$0x20, %dh
	jnz	L(return_null)
	test	$0x40, %ah
	jnz	L(Exit15)
	test	$0x40, %dh
	jnz	L(return_null)
	/* Only bit 7 of %ah can still be set: the match is byte 15.  */
	lea	15(%rdi), %rax
	ret

	/* Match somewhere in bytes 8-11.  */
	.p2align 4
L(match_case2_12):
	test	$0x01, %ah
	jnz	L(Exit9)
	test	$0x01, %dh
	jnz	L(return_null)
	test	$0x02, %ah
	jnz	L(Exit10)
	test	$0x02, %dh
	jnz	L(return_null)
	test	$0x04, %ah
	jnz	L(Exit11)
	test	$0x04, %dh
	jnz	L(return_null)
	/* Only bit 3 of %ah can still be set: the match is byte 11.  */
	lea	11(%rdi), %rax
	ret

	/* Case 1: the chunk holds a match and no NUL, so only the
	   lowest set bit of the match mask has to be found.  */
	.p2align 4
L(match_case1):
	test	%al, %al
	jz	L(match_high_case1)	/* Match is in bytes 8-15.  */

	test	$0x01, %al
	jnz	L(Exit1)
	test	$0x02, %al
	jnz	L(Exit2)
	test	$0x04, %al
	jnz	L(Exit3)
	test	$0x08, %al
	jnz	L(Exit4)
	test	$0x10, %al
	jnz	L(Exit5)
	test	$0x20, %al
	jnz	L(Exit6)
	test	$0x40, %al
	jnz	L(Exit7)
	/* %al is non-zero with bits 0-6 clear: the match is byte 7.  */
	lea	7(%rdi), %rax
	ret

	.p2align 4
L(match_high_case1):
	test	$0x01, %ah
	jnz	L(Exit9)
	test	$0x02, %ah
	jnz	L(Exit10)
	test	$0x04, %ah
	jnz	L(Exit11)
	test	$0x08, %ah
	jnz	L(Exit12)
	test	$0x10, %ah
	jnz	L(Exit13)
	test	$0x20, %ah
	jnz	L(Exit14)
	test	$0x40, %ah
	jnz	L(Exit15)
	/* The mask is non-zero with bits 0-14 clear: the match is
	   byte 15.  */
	lea	15(%rdi), %rax
	ret

	/* Exit stubs: L(ExitN) returns the address of byte N-1 of the
	   chunk at %rdi.  */
	.p2align 4
L(Exit1):
	lea	(%rdi), %rax
	ret

	.p2align 4
L(Exit2):
	lea	1(%rdi), %rax
	ret

	.p2align 4
L(Exit3):
	lea	2(%rdi), %rax
	ret

	.p2align 4
L(Exit4):
	lea	3(%rdi), %rax
	ret

	.p2align 4
L(Exit5):
	lea	4(%rdi), %rax
	ret

	.p2align 4
L(Exit6):
	lea	5(%rdi), %rax
	ret

	.p2align 4
L(Exit7):
	lea	6(%rdi), %rax
	ret

	.p2align 4
L(Exit9):
	lea	8(%rdi), %rax
	ret

	.p2align 4
L(Exit10):
	lea	9(%rdi), %rax
	ret

	.p2align 4
L(Exit11):
	lea	10(%rdi), %rax
	ret

	.p2align 4
L(Exit12):
	lea	11(%rdi), %rax
	ret

	.p2align 4
L(Exit13):
	lea	12(%rdi), %rax
	ret

	.p2align 4
L(Exit14):
	lea	13(%rdi), %rax
	ret

	.p2align 4
L(Exit15):
	lea	14(%rdi), %rax
	ret

END (__strchr_sse2_no_bsf)
#endif