diff options
Diffstat (limited to 'sysdeps/i386/i686')
-rw-r--r-- | sysdeps/i386/i686/multiarch/Makefile | 2 | ||||
-rw-r--r-- | sysdeps/i386/i686/multiarch/wcscmp-c.c | 14 | ||||
-rw-r--r-- | sysdeps/i386/i686/multiarch/wcscmp-sse2.S | 1018 | ||||
-rw-r--r-- | sysdeps/i386/i686/multiarch/wcscmp.S | 39 |
4 files changed, 1 insertions, 1072 deletions
diff --git a/sysdeps/i386/i686/multiarch/Makefile b/sysdeps/i386/i686/multiarch/Makefile index 289f0f9634..a9d032f106 100644 --- a/sysdeps/i386/i686/multiarch/Makefile +++ b/sysdeps/i386/i686/multiarch/Makefile @@ -1,5 +1,5 @@ ifeq ($(subdir),wcsmbs) -sysdep_routines += wcscmp-sse2 wcscmp-c wcslen-sse2 wcslen-c \ +sysdep_routines += wcslen-sse2 wcslen-c \ wmemcmp-sse4 wmemcmp-ssse3 wmemcmp-c \ wcscpy-ssse3 wcscpy-c endif diff --git a/sysdeps/i386/i686/multiarch/wcscmp-c.c b/sysdeps/i386/i686/multiarch/wcscmp-c.c deleted file mode 100644 index e3337d77e2..0000000000 --- a/sysdeps/i386/i686/multiarch/wcscmp-c.c +++ /dev/null @@ -1,14 +0,0 @@ -#include <wchar.h> - -#define WCSCMP __wcscmp_ia32 -#ifdef SHARED -# undef libc_hidden_def -# define libc_hidden_def(name) \ - __hidden_ver1 (__wcscmp_ia32, __GI___wcscmp, __wcscmp_ia32); -#endif -#undef weak_alias -#define weak_alias(name, alias) - -extern __typeof (wcscmp) __wcscmp_ia32; - -#include "wcsmbs/wcscmp.c" diff --git a/sysdeps/i386/i686/multiarch/wcscmp-sse2.S b/sysdeps/i386/i686/multiarch/wcscmp-sse2.S deleted file mode 100644 index b25103df2d..0000000000 --- a/sysdeps/i386/i686/multiarch/wcscmp-sse2.S +++ /dev/null @@ -1,1018 +0,0 @@ -/* wcscmp with SSE2 - Copyright (C) 2011-2015 Free Software Foundation, Inc. - Contributed by Intel Corporation. - This file is part of the GNU C Library. - - The GNU C Library is free software; you can redistribute it and/or - modify it under the terms of the GNU Lesser General Public - License as published by the Free Software Foundation; either - version 2.1 of the License, or (at your option) any later version. - - The GNU C Library is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU - Lesser General Public License for more details. - - You should have received a copy of the GNU Lesser General Public - License along with the GNU C Library; if not, see - <http://www.gnu.org/licenses/>. */ - -#if IS_IN (libc) - -# include <sysdep.h> - -# define CFI_PUSH(REG) \ - cfi_adjust_cfa_offset (4); \ - cfi_rel_offset (REG, 0) - -# define CFI_POP(REG) \ - cfi_adjust_cfa_offset (-4); \ - cfi_restore (REG) - -# define PUSH(REG) pushl REG; CFI_PUSH (REG) -# define POP(REG) popl REG; CFI_POP (REG) - -# define ENTRANCE PUSH(%esi); PUSH(%edi) -# define RETURN POP(%edi); POP(%esi); ret; CFI_PUSH(%esi); CFI_PUSH(%edi); -# define PARMS 4 -# define STR1 PARMS -# define STR2 STR1+4 - -/* Note: wcscmp uses signed comparison, not unsugned as in strcmp function. */ - - .text -ENTRY (__wcscmp_sse2) -/* - * This implementation uses SSE to compare up to 16 bytes at a time. -*/ - mov STR1(%esp), %edx - mov STR2(%esp), %eax - - mov (%eax), %ecx - cmp %ecx, (%edx) - jne L(neq) - test %ecx, %ecx - jz L(eq) - - mov 4(%eax), %ecx - cmp %ecx, 4(%edx) - jne L(neq) - test %ecx, %ecx - jz L(eq) - - mov 8(%eax), %ecx - cmp %ecx, 8(%edx) - jne L(neq) - test %ecx, %ecx - jz L(eq) - - mov 12(%eax), %ecx - cmp %ecx, 12(%edx) - jne L(neq) - test %ecx, %ecx - jz L(eq) - - ENTRANCE - add $16, %eax - add $16, %edx - - mov %eax, %esi - mov %edx, %edi - pxor %xmm0, %xmm0 /* clear %xmm0 for null char checks */ - mov %al, %ch - mov %dl, %cl - and $63, %eax /* esi alignment in cache line */ - and $63, %edx /* edi alignment in cache line */ - and $15, %cl - jz L(continue_00) - cmp $16, %edx - jb L(continue_0) - cmp $32, %edx - jb L(continue_16) - cmp $48, %edx - jb L(continue_32) - -L(continue_48): - and $15, %ch - jz L(continue_48_00) - cmp $16, %eax - jb L(continue_0_48) - cmp $32, %eax - jb L(continue_16_48) - cmp $48, %eax - jb L(continue_32_48) - - .p2align 4 -L(continue_48_48): - mov (%esi), %ecx - cmp %ecx, (%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 4(%esi), %ecx - cmp %ecx, 4(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 8(%esi), %ecx - cmp %ecx, 8(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 12(%esi), %ecx - cmp %ecx, 12(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - movdqu 16(%edi), %xmm1 - movdqu 16(%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - movdqu 32(%edi), %xmm1 - movdqu 32(%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_32) - - movdqu 48(%edi), %xmm1 - movdqu 48(%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_48) - - add $64, %esi - add $64, %edi - jmp L(continue_48_48) - -L(continue_0): - and $15, %ch - jz L(continue_0_00) - cmp $16, %eax - jb L(continue_0_0) - cmp $32, %eax - jb L(continue_0_16) - cmp $48, %eax - jb L(continue_0_32) - - .p2align 4 -L(continue_0_48): - mov (%esi), %ecx - cmp %ecx, (%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 4(%esi), %ecx - cmp %ecx, 4(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 8(%esi), %ecx - cmp %ecx, 8(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 12(%esi), %ecx - cmp %ecx, 12(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - movdqu 16(%edi), %xmm1 - movdqu 16(%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - movdqu 32(%edi), %xmm1 - movdqu 32(%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_32) - - mov 48(%esi), %ecx - cmp %ecx, 48(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 52(%esi), %ecx - cmp %ecx, 52(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 56(%esi), %ecx - cmp %ecx, 56(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 60(%esi), %ecx - cmp %ecx, 60(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - add $64, %esi - add $64, %edi - jmp L(continue_0_48) - - .p2align 4 -L(continue_00): - and $15, %ch - jz L(continue_00_00) - cmp $16, %eax - jb L(continue_00_0) - cmp $32, %eax - jb L(continue_00_16) - cmp $48, %eax - jb L(continue_00_32) - - .p2align 4 -L(continue_00_48): - pcmpeqd (%edi), %xmm0 - mov (%edi), %eax - pmovmskb %xmm0, %ecx - test %ecx, %ecx - jnz L(less4_double_words1) - - cmp (%esi), %eax - jne L(nequal) - - mov 4(%edi), %eax - cmp 4(%esi), %eax - jne L(nequal) - - mov 8(%edi), %eax - cmp 8(%esi), %eax - jne L(nequal) - - mov 12(%edi), %eax - cmp 12(%esi), %eax - jne L(nequal) - - movdqu 16(%esi), %xmm2 - pcmpeqd %xmm2, %xmm0 /* Any null double_word? */ - pcmpeqd 16(%edi), %xmm2 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm2 /* packed sub of comparison results*/ - pmovmskb %xmm2, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - movdqu 32(%esi), %xmm2 - pcmpeqd %xmm2, %xmm0 /* Any null double_word? */ - pcmpeqd 32(%edi), %xmm2 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm2 /* packed sub of comparison results*/ - pmovmskb %xmm2, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_32) - - movdqu 48(%esi), %xmm2 - pcmpeqd %xmm2, %xmm0 /* Any null double_word? */ - pcmpeqd 48(%edi), %xmm2 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm2 /* packed sub of comparison results*/ - pmovmskb %xmm2, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_48) - - add $64, %esi - add $64, %edi - jmp L(continue_00_48) - - .p2align 4 -L(continue_32): - and $15, %ch - jz L(continue_32_00) - cmp $16, %eax - jb L(continue_0_32) - cmp $32, %eax - jb L(continue_16_32) - cmp $48, %eax - jb L(continue_32_32) - - .p2align 4 -L(continue_32_48): - mov (%esi), %ecx - cmp %ecx, (%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 4(%esi), %ecx - cmp %ecx, 4(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 8(%esi), %ecx - cmp %ecx, 8(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 12(%esi), %ecx - cmp %ecx, 12(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 16(%esi), %ecx - cmp %ecx, 16(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 20(%esi), %ecx - cmp %ecx, 20(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 24(%esi), %ecx - cmp %ecx, 24(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 28(%esi), %ecx - cmp %ecx, 28(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - movdqu 32(%edi), %xmm1 - movdqu 32(%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_32) - - movdqu 48(%edi), %xmm1 - movdqu 48(%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results */ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_48) - - add $64, %esi - add $64, %edi - jmp L(continue_32_48) - - .p2align 4 -L(continue_16): - and $15, %ch - jz L(continue_16_00) - cmp $16, %eax - jb L(continue_0_16) - cmp $32, %eax - jb L(continue_16_16) - cmp $48, %eax - jb L(continue_16_32) - - .p2align 4 -L(continue_16_48): - mov (%esi), %ecx - cmp %ecx, (%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 4(%esi), %ecx - cmp %ecx, 4(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 8(%esi), %ecx - cmp %ecx, 8(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 12(%esi), %ecx - cmp %ecx, 12(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - movdqu 16(%edi), %xmm1 - movdqu 16(%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - mov 32(%esi), %ecx - cmp %ecx, 32(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 36(%esi), %ecx - cmp %ecx, 36(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 40(%esi), %ecx - cmp %ecx, 40(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 44(%esi), %ecx - cmp %ecx, 44(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - movdqu 48(%edi), %xmm1 - movdqu 48(%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_48) - - add $64, %esi - add $64, %edi - jmp L(continue_16_48) - - .p2align 4 -L(continue_00_00): - movdqa (%edi), %xmm1 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd (%esi), %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - movdqa 16(%edi), %xmm3 - pcmpeqd %xmm3, %xmm0 /* Any null double_word? */ - pcmpeqd 16(%esi), %xmm3 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm3 /* packed sub of comparison results*/ - pmovmskb %xmm3, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - movdqa 32(%edi), %xmm5 - pcmpeqd %xmm5, %xmm0 /* Any null double_word? */ - pcmpeqd 32(%esi), %xmm5 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm5 /* packed sub of comparison results*/ - pmovmskb %xmm5, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_32) - - movdqa 48(%edi), %xmm1 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd 48(%esi), %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_48) - - add $64, %esi - add $64, %edi - jmp L(continue_00_00) - - .p2align 4 -L(continue_00_32): - movdqu (%esi), %xmm2 - pcmpeqd %xmm2, %xmm0 /* Any null double_word? */ - pcmpeqd (%edi), %xmm2 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm2 /* packed sub of comparison results*/ - pmovmskb %xmm2, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - add $16, %esi - add $16, %edi - jmp L(continue_00_48) - - .p2align 4 -L(continue_00_16): - movdqu (%esi), %xmm2 - pcmpeqd %xmm2, %xmm0 /* Any null double_word? */ - pcmpeqd (%edi), %xmm2 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm2 /* packed sub of comparison results*/ - pmovmskb %xmm2, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - movdqu 16(%esi), %xmm2 - pcmpeqd %xmm2, %xmm0 /* Any null double_word? */ - pcmpeqd 16(%edi), %xmm2 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm2 /* packed sub of comparison results*/ - pmovmskb %xmm2, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - add $32, %esi - add $32, %edi - jmp L(continue_00_48) - - .p2align 4 -L(continue_00_0): - movdqu (%esi), %xmm2 - pcmpeqd %xmm2, %xmm0 /* Any null double_word? */ - pcmpeqd (%edi), %xmm2 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm2 /* packed sub of comparison results*/ - pmovmskb %xmm2, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - movdqu 16(%esi), %xmm2 - pcmpeqd %xmm2, %xmm0 /* Any null double_word? */ - pcmpeqd 16(%edi), %xmm2 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm2 /* packed sub of comparison results*/ - pmovmskb %xmm2, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - movdqu 32(%esi), %xmm2 - pcmpeqd %xmm2, %xmm0 /* Any null double_word? */ - pcmpeqd 32(%edi), %xmm2 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm2 /* packed sub of comparison results*/ - pmovmskb %xmm2, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_32) - - add $48, %esi - add $48, %edi - jmp L(continue_00_48) - - .p2align 4 -L(continue_48_00): - pcmpeqd (%esi), %xmm0 - mov (%edi), %eax - pmovmskb %xmm0, %ecx - test %ecx, %ecx - jnz L(less4_double_words1) - - cmp (%esi), %eax - jne L(nequal) - - mov 4(%edi), %eax - cmp 4(%esi), %eax - jne L(nequal) - - mov 8(%edi), %eax - cmp 8(%esi), %eax - jne L(nequal) - - mov 12(%edi), %eax - cmp 12(%esi), %eax - jne L(nequal) - - movdqu 16(%edi), %xmm1 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd 16(%esi), %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - movdqu 32(%edi), %xmm1 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd 32(%esi), %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_32) - - movdqu 48(%edi), %xmm1 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd 48(%esi), %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_48) - - add $64, %esi - add $64, %edi - jmp L(continue_48_00) - - .p2align 4 -L(continue_32_00): - movdqu (%edi), %xmm1 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd (%esi), %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - add $16, %esi - add $16, %edi - jmp L(continue_48_00) - - .p2align 4 -L(continue_16_00): - movdqu (%edi), %xmm1 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd (%esi), %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - movdqu 16(%edi), %xmm1 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd 16(%esi), %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - add $32, %esi - add $32, %edi - jmp L(continue_48_00) - - .p2align 4 -L(continue_0_00): - movdqu (%edi), %xmm1 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd (%esi), %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - movdqu 16(%edi), %xmm1 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd 16(%esi), %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - movdqu 32(%edi), %xmm1 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd 32(%esi), %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_32) - - add $48, %esi - add $48, %edi - jmp L(continue_48_00) - - .p2align 4 -L(continue_32_32): - movdqu (%edi), %xmm1 - movdqu (%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - add $16, %esi - add $16, %edi - jmp L(continue_48_48) - - .p2align 4 -L(continue_16_16): - movdqu (%edi), %xmm1 - movdqu (%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - movdqu 16(%edi), %xmm3 - movdqu 16(%esi), %xmm4 - pcmpeqd %xmm3, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm4, %xmm3 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm3 /* packed sub of comparison results*/ - pmovmskb %xmm3, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - add $32, %esi - add $32, %edi - jmp L(continue_48_48) - - .p2align 4 -L(continue_0_0): - movdqu (%edi), %xmm1 - movdqu (%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - movdqu 16(%edi), %xmm3 - movdqu 16(%esi), %xmm4 - pcmpeqd %xmm3, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm4, %xmm3 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm3 /* packed sub of comparison results*/ - pmovmskb %xmm3, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - movdqu 32(%edi), %xmm1 - movdqu 32(%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_32) - - add $48, %esi - add $48, %edi - jmp L(continue_48_48) - - .p2align 4 -L(continue_0_16): - movdqu (%edi), %xmm1 - movdqu (%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - movdqu 16(%edi), %xmm1 - movdqu 16(%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words_16) - - add $32, %esi - add $32, %edi - jmp L(continue_32_48) - - .p2align 4 -L(continue_0_32): - movdqu (%edi), %xmm1 - movdqu (%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - add $16, %esi - add $16, %edi - jmp L(continue_16_48) - - .p2align 4 -L(continue_16_32): - movdqu (%edi), %xmm1 - movdqu (%esi), %xmm2 - pcmpeqd %xmm1, %xmm0 /* Any null double_word? */ - pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */ - psubb %xmm0, %xmm1 /* packed sub of comparison results*/ - pmovmskb %xmm1, %edx - sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */ - jnz L(less4_double_words) - - add $16, %esi - add $16, %edi - jmp L(continue_32_48) - - .p2align 4 -L(less4_double_words1): - cmp (%esi), %eax - jne L(nequal) - test %eax, %eax - jz L(equal) - - mov 4(%esi), %ecx - cmp %ecx, 4(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 8(%esi), %ecx - cmp %ecx, 8(%edi) - jne L(nequal) - test %ecx, %ecx - jz L(equal) - - mov 12(%esi), %ecx - cmp %ecx, 12(%edi) - jne L(nequal) - xor %eax, %eax - RETURN - - .p2align 4 -L(less4_double_words): - xor %eax, %eax - test %dl, %dl - jz L(next_two_double_words) - and $15, %dl - jz L(second_double_word) - mov (%esi), %ecx - cmp %ecx, (%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(second_double_word): - mov 4(%esi), %ecx - cmp %ecx, 4(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(next_two_double_words): - and $15, %dh - jz L(fourth_double_word) - mov 8(%esi), %ecx - cmp %ecx, 8(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(fourth_double_word): - mov 12(%esi), %ecx - cmp %ecx, 12(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(less4_double_words_16): - xor %eax, %eax - test %dl, %dl - jz L(next_two_double_words_16) - and $15, %dl - jz L(second_double_word_16) - mov 16(%esi), %ecx - cmp %ecx, 16(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(second_double_word_16): - mov 20(%esi), %ecx - cmp %ecx, 20(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(next_two_double_words_16): - and $15, %dh - jz L(fourth_double_word_16) - mov 24(%esi), %ecx - cmp %ecx, 24(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(fourth_double_word_16): - mov 28(%esi), %ecx - cmp %ecx, 28(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(less4_double_words_32): - xor %eax, %eax - test %dl, %dl - jz L(next_two_double_words_32) - and $15, %dl - jz L(second_double_word_32) - mov 32(%esi), %ecx - cmp %ecx, 32(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(second_double_word_32): - mov 36(%esi), %ecx - cmp %ecx, 36(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(next_two_double_words_32): - and $15, %dh - jz L(fourth_double_word_32) - mov 40(%esi), %ecx - cmp %ecx, 40(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(fourth_double_word_32): - mov 44(%esi), %ecx - cmp %ecx, 44(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(less4_double_words_48): - xor %eax, %eax - test %dl, %dl - jz L(next_two_double_words_48) - and $15, %dl - jz L(second_double_word_48) - mov 48(%esi), %ecx - cmp %ecx, 48(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(second_double_word_48): - mov 52(%esi), %ecx - cmp %ecx, 52(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(next_two_double_words_48): - and $15, %dh - jz L(fourth_double_word_48) - mov 56(%esi), %ecx - cmp %ecx, 56(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(fourth_double_word_48): - mov 60(%esi), %ecx - cmp %ecx, 60(%edi) - jne L(nequal) - RETURN - - .p2align 4 -L(nequal): - mov $1, %eax - jg L(return) - neg %eax - RETURN - - .p2align 4 -L(return): - RETURN - - .p2align 4 -L(equal): - xorl %eax, %eax - RETURN - - CFI_POP (%edi) - CFI_POP (%esi) - - .p2align 4 -L(neq): - mov $1, %eax - jg L(neq_bigger) - neg %eax - -L(neq_bigger): - ret - - .p2align 4 -L(eq): - xorl %eax, %eax - ret - -END (__wcscmp_sse2) -#endif diff --git a/sysdeps/i386/i686/multiarch/wcscmp.S b/sysdeps/i386/i686/multiarch/wcscmp.S deleted file mode 100644 index db9c05af0d..0000000000 --- a/sysdeps/i386/i686/multiarch/wcscmp.S +++ /dev/null @@ -1,39 +0,0 @@ -/* Multiple versions of wcscmp - All versions must be listed in ifunc-impl-list.c. - Copyright (C) 2011-2015 Free Software Foundation, Inc. - Contributed by Intel Corporation. - This file is part of the GNU C Library. - - The GNU C Library is free software; you can redistribute it and/or - modify it under the terms of the GNU Lesser General Public - License as published by the Free Software Foundation; either - version 2.1 of the License, or (at your option) any later version. - - The GNU C Library is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU - Lesser General Public License for more details. - - You should have received a copy of the GNU Lesser General Public - License along with the GNU C Library; if not, see - <http://www.gnu.org/licenses/>. */ - -#include <sysdep.h> -#include <init-arch.h> - -/* Define multiple versions only for the definition in libc and for the - DSO. In static binaries, we need wcscmp before the initialization - happened. */ -#if IS_IN (libc) - .text -ENTRY(__wcscmp) - .type __wcscmp, @gnu_indirect_function - LOAD_GOT_AND_RTLD_GLOBAL_RO - LOAD_FUNC_GOT_EAX (__wcscmp_ia32) - HAS_CPU_FEATURE (SSE2) - jz 2f - LOAD_FUNC_GOT_EAX (__wcscmp_sse2) -2: ret -END(__wcscmp) -weak_alias (__wcscmp, wcscmp) -#endif |