diff options
author | H.J. Lu <hjl.tools@gmail.com> | 2015-08-23 12:47:24 -0700 |
---|---|---|
committer | H.J. Lu <hjl.tools@gmail.com> | 2015-08-27 09:35:11 -0700 |
commit | eafb1c2a37d1886de47e7fa757f869c4daf5a491 (patch) | |
tree | ef42196fb03056c7e69ef6fccb9fbb93c3bec3da /sysdeps/i386/i686/multiarch | |
parent | d5496eb9a14df0fe463c211f5fe05cc73e8e770c (diff) | |
download | glibc-eafb1c2a37d1886de47e7fa757f869c4daf5a491.tar.gz glibc-eafb1c2a37d1886de47e7fa757f869c4daf5a491.tar.xz glibc-eafb1c2a37d1886de47e7fa757f869c4daf5a491.zip |
Add i386 strchr multiarch functions
Diffstat (limited to 'sysdeps/i386/i686/multiarch')
-rw-r--r-- | sysdeps/i386/i686/multiarch/Makefile | 2 | ||||
-rw-r--r-- | sysdeps/i386/i686/multiarch/strchr-i586.S | 1 | ||||
-rw-r--r-- | sysdeps/i386/i686/multiarch/strchr-sse2-bsf.S | 158 | ||||
-rw-r--r-- | sysdeps/i386/i686/multiarch/strchr-sse2.S | 348 | ||||
-rw-r--r-- | sysdeps/i386/i686/multiarch/strchr.S | 57 |
5 files changed, 2 insertions, 564 deletions
diff --git a/sysdeps/i386/i686/multiarch/Makefile b/sysdeps/i386/i686/multiarch/Makefile index 830c77d951..788dccb2c9 100644 --- a/sysdeps/i386/i686/multiarch/Makefile +++ b/sysdeps/i386/i686/multiarch/Makefile @@ -1,7 +1,7 @@ ifeq ($(subdir),string) sysdep_routines += varshift \ strlen-sse2 strlen-sse2-bsf \ - strchr-sse2 strrchr-sse2 strchr-sse2-bsf strrchr-sse2-bsf \ + strrchr-sse2 strrchr-sse2-bsf \ strnlen-sse2 strnlen-c ifeq (yes,$(config-cflags-sse4)) sysdep_routines += strcspn-c strpbrk-c strspn-c diff --git a/sysdeps/i386/i686/multiarch/strchr-i586.S b/sysdeps/i386/i686/multiarch/strchr-i586.S new file mode 100644 index 0000000000..9d841c9fd1 --- /dev/null +++ b/sysdeps/i386/i686/multiarch/strchr-i586.S @@ -0,0 +1 @@ +/* Dummy file. */ diff --git a/sysdeps/i386/i686/multiarch/strchr-sse2-bsf.S b/sysdeps/i386/i686/multiarch/strchr-sse2-bsf.S deleted file mode 100644 index ba2723bb51..0000000000 --- a/sysdeps/i386/i686/multiarch/strchr-sse2-bsf.S +++ /dev/null @@ -1,158 +0,0 @@ -/* strchr with SSE2 with bsf - Copyright (C) 2011-2015 Free Software Foundation, Inc. - Contributed by Intel Corporation. - This file is part of the GNU C Library. - - The GNU C Library is free software; you can redistribute it and/or - modify it under the terms of the GNU Lesser General Public - License as published by the Free Software Foundation; either - version 2.1 of the License, or (at your option) any later version. - - The GNU C Library is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU - Lesser General Public License for more details. - - You should have received a copy of the GNU Lesser General Public - License along with the GNU C Library; if not, see - <http://www.gnu.org/licenses/>. */ - -#if IS_IN (libc) - -# include <sysdep.h> - -# define CFI_PUSH(REG) \ - cfi_adjust_cfa_offset (4); \ - cfi_rel_offset (REG, 0) - -# define CFI_POP(REG) \ - cfi_adjust_cfa_offset (-4); \ - cfi_restore (REG) - -# define PUSH(REG) pushl REG; CFI_PUSH (REG) -# define POP(REG) popl REG; CFI_POP (REG) - -# define PARMS 8 -# define ENTRANCE PUSH(%edi) -# define RETURN POP(%edi); ret; CFI_PUSH(%edi); - -# define STR1 PARMS -# define STR2 STR1+4 - - .text -ENTRY (__strchr_sse2_bsf) - - ENTRANCE - mov STR1(%esp), %ecx - movd STR2(%esp), %xmm1 - - pxor %xmm2, %xmm2 - mov %ecx, %edi - punpcklbw %xmm1, %xmm1 - punpcklbw %xmm1, %xmm1 - /* ECX has OFFSET. */ - and $15, %ecx - pshufd $0, %xmm1, %xmm1 - je L(loop) - -/* Handle unaligned string. */ - and $-16, %edi - movdqa (%edi), %xmm0 - pcmpeqb %xmm0, %xmm2 - pcmpeqb %xmm1, %xmm0 - /* Find where NULL is. */ - pmovmskb %xmm2, %edx - /* Check if there is a match. */ - pmovmskb %xmm0, %eax - /* Remove the leading bytes. */ - sarl %cl, %edx - sarl %cl, %eax - test %eax, %eax - je L(unaligned_no_match) - /* Check which byte is a match. */ - bsf %eax, %eax - /* Is there a NULL? */ - test %edx, %edx - je L(unaligned_match) - bsf %edx, %edx - cmpl %edx, %eax - /* Return NULL if NULL comes first. */ - ja L(return_null) -L(unaligned_match): - add %edi, %eax - add %ecx, %eax - RETURN - - .p2align 4 -L(unaligned_no_match): - test %edx, %edx - jne L(return_null) - pxor %xmm2, %xmm2 - - add $16, %edi - - .p2align 4 -/* Loop start on aligned string. */ -L(loop): - movdqa (%edi), %xmm0 - pcmpeqb %xmm0, %xmm2 - add $16, %edi - pcmpeqb %xmm1, %xmm0 - pmovmskb %xmm2, %edx - pmovmskb %xmm0, %eax - or %eax, %edx - jnz L(matches) - - movdqa (%edi), %xmm0 - pcmpeqb %xmm0, %xmm2 - add $16, %edi - pcmpeqb %xmm1, %xmm0 - pmovmskb %xmm2, %edx - pmovmskb %xmm0, %eax - or %eax, %edx - jnz L(matches) - - movdqa (%edi), %xmm0 - pcmpeqb %xmm0, %xmm2 - add $16, %edi - pcmpeqb %xmm1, %xmm0 - pmovmskb %xmm2, %edx - pmovmskb %xmm0, %eax - or %eax, %edx - jnz L(matches) - - movdqa (%edi), %xmm0 - pcmpeqb %xmm0, %xmm2 - add $16, %edi - pcmpeqb %xmm1, %xmm0 - pmovmskb %xmm2, %edx - pmovmskb %xmm0, %eax - or %eax, %edx - jnz L(matches) - jmp L(loop) - -L(matches): - pmovmskb %xmm2, %edx - test %eax, %eax - jz L(return_null) - bsf %eax, %eax - /* There is a match. First find where NULL is. */ - test %edx, %edx - je L(match) - bsf %edx, %ecx - /* Check if NULL comes first. */ - cmpl %ecx, %eax - ja L(return_null) -L(match): - sub $16, %edi - add %edi, %eax - RETURN - -/* Return NULL. */ - .p2align 4 -L(return_null): - xor %eax, %eax - RETURN - -END (__strchr_sse2_bsf) -#endif diff --git a/sysdeps/i386/i686/multiarch/strchr-sse2.S b/sysdeps/i386/i686/multiarch/strchr-sse2.S deleted file mode 100644 index 4f387eaeea..0000000000 --- a/sysdeps/i386/i686/multiarch/strchr-sse2.S +++ /dev/null @@ -1,348 +0,0 @@ -/* strchr SSE2 without bsf - Copyright (C) 2011-2015 Free Software Foundation, Inc. - Contributed by Intel Corporation. - This file is part of the GNU C Library. - - The GNU C Library is free software; you can redistribute it and/or - modify it under the terms of the GNU Lesser General Public - License as published by the Free Software Foundation; either - version 2.1 of the License, or (at your option) any later version. - - The GNU C Library is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU - Lesser General Public License for more details. - - You should have received a copy of the GNU Lesser General Public - License along with the GNU C Library; if not, see - <http://www.gnu.org/licenses/>. */ - -#if IS_IN (libc) - -# include <sysdep.h> - -# define CFI_PUSH(REG) \ - cfi_adjust_cfa_offset (4); \ - cfi_rel_offset (REG, 0) - -# define CFI_POP(REG) \ - cfi_adjust_cfa_offset (-4); \ - cfi_restore (REG) - -# define PUSH(REG) pushl REG; CFI_PUSH (REG) -# define POP(REG) popl REG; CFI_POP (REG) - -# define PARMS 8 -# define ENTRANCE PUSH(%edi) -# define RETURN POP(%edi); ret; CFI_PUSH(%edi); - -# define STR1 PARMS -# define STR2 STR1+4 - - atom_text_section -ENTRY (__strchr_sse2) - - ENTRANCE - mov STR1(%esp), %ecx - movd STR2(%esp), %xmm1 - - pxor %xmm2, %xmm2 - mov %ecx, %edi - punpcklbw %xmm1, %xmm1 - punpcklbw %xmm1, %xmm1 - /* ECX has OFFSET. */ - and $15, %ecx - pshufd $0, %xmm1, %xmm1 - je L(loop) - -/* Handle unaligned string. */ - and $-16, %edi - movdqa (%edi), %xmm0 - pcmpeqb %xmm0, %xmm2 - pcmpeqb %xmm1, %xmm0 - /* Find where NULL is. */ - pmovmskb %xmm2, %edx - /* Check if there is a match. */ - pmovmskb %xmm0, %eax - /* Remove the leading bytes. */ - sarl %cl, %edx - sarl %cl, %eax - test %eax, %eax - jz L(unaligned_no_match) - /* Check which byte is a match. */ - /* Is there a NULL? */ - add %ecx, %edi - test %edx, %edx - jz L(match_case1) - jmp L(match_case2) - - .p2align 4 -L(unaligned_no_match): - test %edx, %edx - jne L(return_null) - - pxor %xmm2, %xmm2 - add $16, %edi - - .p2align 4 -/* Loop start on aligned string. */ -L(loop): - movdqa (%edi), %xmm0 - pcmpeqb %xmm0, %xmm2 - pcmpeqb %xmm1, %xmm0 - pmovmskb %xmm2, %edx - pmovmskb %xmm0, %eax - test %eax, %eax - jnz L(matches) - test %edx, %edx - jnz L(return_null) - add $16, %edi - - movdqa (%edi), %xmm0 - pcmpeqb %xmm0, %xmm2 - pcmpeqb %xmm1, %xmm0 - pmovmskb %xmm2, %edx - pmovmskb %xmm0, %eax - test %eax, %eax - jnz L(matches) - test %edx, %edx - jnz L(return_null) - add $16, %edi - - movdqa (%edi), %xmm0 - pcmpeqb %xmm0, %xmm2 - pcmpeqb %xmm1, %xmm0 - pmovmskb %xmm2, %edx - pmovmskb %xmm0, %eax - test %eax, %eax - jnz L(matches) - test %edx, %edx - jnz L(return_null) - add $16, %edi - - movdqa (%edi), %xmm0 - pcmpeqb %xmm0, %xmm2 - pcmpeqb %xmm1, %xmm0 - pmovmskb %xmm2, %edx - pmovmskb %xmm0, %eax - test %eax, %eax - jnz L(matches) - test %edx, %edx - jnz L(return_null) - add $16, %edi - jmp L(loop) - -L(matches): - /* There is a match. First find where NULL is. */ - test %edx, %edx - jz L(match_case1) - - .p2align 4 -L(match_case2): - test %al, %al - jz L(match_higth_case2) - - mov %al, %cl - and $15, %cl - jnz L(match_case2_4) - - mov %dl, %ch - and $15, %ch - jnz L(return_null) - - test $0x10, %al - jnz L(Exit5) - test $0x10, %dl - jnz L(return_null) - test $0x20, %al - jnz L(Exit6) - test $0x20, %dl - jnz L(return_null) - test $0x40, %al - jnz L(Exit7) - test $0x40, %dl - jnz L(return_null) - lea 7(%edi), %eax - RETURN - - .p2align 4 -L(match_case2_4): - test $0x01, %al - jnz L(Exit1) - test $0x01, %dl - jnz L(return_null) - test $0x02, %al - jnz L(Exit2) - test $0x02, %dl - jnz L(return_null) - test $0x04, %al - jnz L(Exit3) - test $0x04, %dl - jnz L(return_null) - lea 3(%edi), %eax - RETURN - - .p2align 4 -L(match_higth_case2): - test %dl, %dl - jnz L(return_null) - - mov %ah, %cl - and $15, %cl - jnz L(match_case2_12) - - mov %dh, %ch - and $15, %ch - jnz L(return_null) - - test $0x10, %ah - jnz L(Exit13) - test $0x10, %dh - jnz L(return_null) - test $0x20, %ah - jnz L(Exit14) - test $0x20, %dh - jnz L(return_null) - test $0x40, %ah - jnz L(Exit15) - test $0x40, %dh - jnz L(return_null) - lea 15(%edi), %eax - RETURN - - .p2align 4 -L(match_case2_12): - test $0x01, %ah - jnz L(Exit9) - test $0x01, %dh - jnz L(return_null) - test $0x02, %ah - jnz L(Exit10) - test $0x02, %dh - jnz L(return_null) - test $0x04, %ah - jnz L(Exit11) - test $0x04, %dh - jnz L(return_null) - lea 11(%edi), %eax - RETURN - - .p2align 4 -L(match_case1): - test %al, %al - jz L(match_higth_case1) - - test $0x01, %al - jnz L(Exit1) - test $0x02, %al - jnz L(Exit2) - test $0x04, %al - jnz L(Exit3) - test $0x08, %al - jnz L(Exit4) - test $0x10, %al - jnz L(Exit5) - test $0x20, %al - jnz L(Exit6) - test $0x40, %al - jnz L(Exit7) - lea 7(%edi), %eax - RETURN - - .p2align 4 -L(match_higth_case1): - test $0x01, %ah - jnz L(Exit9) - test $0x02, %ah - jnz L(Exit10) - test $0x04, %ah - jnz L(Exit11) - test $0x08, %ah - jnz L(Exit12) - test $0x10, %ah - jnz L(Exit13) - test $0x20, %ah - jnz L(Exit14) - test $0x40, %ah - jnz L(Exit15) - lea 15(%edi), %eax - RETURN - - .p2align 4 -L(Exit1): - lea (%edi), %eax - RETURN - - .p2align 4 -L(Exit2): - lea 1(%edi), %eax - RETURN - - .p2align 4 -L(Exit3): - lea 2(%edi), %eax - RETURN - - .p2align 4 -L(Exit4): - lea 3(%edi), %eax - RETURN - - .p2align 4 -L(Exit5): - lea 4(%edi), %eax - RETURN - - .p2align 4 -L(Exit6): - lea 5(%edi), %eax - RETURN - - .p2align 4 -L(Exit7): - lea 6(%edi), %eax - RETURN - - .p2align 4 -L(Exit9): - lea 8(%edi), %eax - RETURN - - .p2align 4 -L(Exit10): - lea 9(%edi), %eax - RETURN - - .p2align 4 -L(Exit11): - lea 10(%edi), %eax - RETURN - - .p2align 4 -L(Exit12): - lea 11(%edi), %eax - RETURN - - .p2align 4 -L(Exit13): - lea 12(%edi), %eax - RETURN - - .p2align 4 -L(Exit14): - lea 13(%edi), %eax - RETURN - - .p2align 4 -L(Exit15): - lea 14(%edi), %eax - RETURN - -/* Return NULL. */ - .p2align 4 -L(return_null): - xor %eax, %eax - RETURN - -END (__strchr_sse2) -#endif diff --git a/sysdeps/i386/i686/multiarch/strchr.S b/sysdeps/i386/i686/multiarch/strchr.S deleted file mode 100644 index 6b4656582a..0000000000 --- a/sysdeps/i386/i686/multiarch/strchr.S +++ /dev/null @@ -1,57 +0,0 @@ -/* Multiple versions of strchr - All versions must be listed in ifunc-impl-list.c. - Copyright (C) 2011-2015 Free Software Foundation, Inc. - Contributed by Intel Corporation. - This file is part of the GNU C Library. - - The GNU C Library is free software; you can redistribute it and/or - modify it under the terms of the GNU Lesser General Public - License as published by the Free Software Foundation; either - version 2.1 of the License, or (at your option) any later version. - - The GNU C Library is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU - Lesser General Public License for more details. - - You should have received a copy of the GNU Lesser General Public - License along with the GNU C Library; if not, see - <http://www.gnu.org/licenses/>. */ - -#include <sysdep.h> -#include <init-arch.h> - -#if IS_IN (libc) - .text -ENTRY(strchr) - .type strchr, @gnu_indirect_function - LOAD_GOT_AND_RTLD_GLOBAL_RO - LOAD_FUNC_GOT_EAX (__strchr_ia32) - HAS_CPU_FEATURE (SSE2) - jz 2f - LOAD_FUNC_GOT_EAX (__strchr_sse2_bsf) - HAS_ARCH_FEATURE (Slow_BSF) - jz 2f - LOAD_FUNC_GOT_EAX (__strchr_sse2) -2: ret -END(strchr) - -# undef ENTRY -# define ENTRY(name) \ - .type __strchr_ia32, @function; \ - .globl __strchr_ia32; \ - .p2align 4; \ - __strchr_ia32: cfi_startproc; \ - CALL_MCOUNT -# undef END -# define END(name) \ - cfi_endproc; .size __strchr_ia32, .-__strchr_ia32 -# undef libc_hidden_builtin_def -/* IFUNC doesn't work with the hidden functions in shared library since - they will be called without setting up EBX needed for PLT which is - used by IFUNC. */ -# define libc_hidden_builtin_def(name) \ - .globl __GI_strchr; __GI_strchr = __strchr_ia32 -#endif - -#include "../../i586/strchr.S" |