glibc/sysdeps/i386/i686/multiarch/wcscmp-sse2.S

1019 lines
24 KiB
ArmAsm
Raw Normal View History

2011-09-05 13:53:27 -04:00
/* wcscmp with SSE2
Copyright (C) 2011-2014 Free Software Foundation, Inc.
2011-09-05 13:53:27 -04:00
Contributed by Intel Corporation.
This file is part of the GNU C Library.
The GNU C Library is free software; you can redistribute it and/or
modify it under the terms of the GNU Lesser General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
The GNU C Library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with the GNU C Library; if not, see
<http://www.gnu.org/licenses/>. */
2011-09-05 13:53:27 -04:00
Remove NOT_IN_libc Replace with !IS_IN (libc). This completes the transition from the IS_IN/NOT_IN macros to the IN_MODULE macro set. The generated code is unchanged on x86_64. * stdlib/isomac.c (fmt): Replace NOT_IN_libc with IN_MODULE. (get_null_defines): Adjust. * sunrpc/Makefile: Adjust comment. * Makerules (CPPFLAGS-nonlib): Remove NOT_IN_libc. * elf/Makefile (CPPFLAGS-sotruss-lib): Likewise. (CFLAGS-interp.c): Likewise. (CFLAGS-ldconfig.c): Likewise. (CPPFLAGS-.os): Likewise. * elf/rtld-Rules (rtld-CPPFLAGS): Likewise. * extra-lib.mk (CPPFLAGS-$(lib)): Likewise. * extra-modules.mk (extra-modules.mk): Likewise. * iconv/Makefile (CPPFLAGS-iconvprogs): Likewise. * locale/Makefile (CPPFLAGS-locale_programs): Likewise. * malloc/Makefile (CPPFLAGS-memusagestat): Likewise. * nscd/Makefile (CPPFLAGS-nscd): Likewise. * nss/Makefile (CPPFLAGS-nss_test1): Likewise. * stdlib/Makefile (CFLAGS-tst-putenvmod.c): Likewise. * sysdeps/gnu/Makefile ($(objpfx)errlist-compat.c): Likewise. * sysdeps/unix/sysv/linux/Makefile (CPPFLAGS-lddlibc4): Likewise. * iconvdata/Makefile (CPPFLAGS): Likewise. (cpp-srcs-left): Add libof for all iconvdata routines. * bits/stdio-lock.h: Replace NOT_IN_libc with IS_IN. * include/assert.h: Likewise. * include/ctype.h: Likewise. * include/errno.h: Likewise. * include/libc-symbols.h: Likewise. * include/math.h: Likewise. * include/netdb.h: Likewise. * include/resolv.h: Likewise. * include/stdio.h: Likewise. * include/stdlib.h: Likewise. * include/string.h: Likewise. * include/sys/stat.h: Likewise. * include/wctype.h: Likewise. * intl/l10nflist.c: Likewise. * libidn/idn-stub.c: Likewise. * libio/libioP.h: Likewise. * nptl/libc_multiple_threads.c: Likewise. * nptl/pthreadP.h: Likewise. * posix/regex_internal.h: Likewise. * resolv/res_hconf.c: Likewise. * sysdeps/arm/armv7/multiarch/memcpy.S: Likewise. * sysdeps/arm/memmove.S: Likewise. * sysdeps/arm/sysdep.h: Likewise. * sysdeps/generic/_itoa.h: Likewise. * sysdeps/generic/symbol-hacks.h: Likewise. * sysdeps/gnu/errlist.awk: Likewise. * sysdeps/gnu/errlist.c: Likewise. * sysdeps/i386/i586/memcpy.S: Likewise. * sysdeps/i386/i586/memset.S: Likewise. * sysdeps/i386/i686/memcpy.S: Likewise. * sysdeps/i386/i686/memmove.S: Likewise. * sysdeps/i386/i686/mempcpy.S: Likewise. * sysdeps/i386/i686/memset.S: Likewise. * sysdeps/i386/i686/multiarch/bcopy.S: Likewise. * sysdeps/i386/i686/multiarch/bzero.S: Likewise. * sysdeps/i386/i686/multiarch/memchr-sse2-bsf.S: Likewise. * sysdeps/i386/i686/multiarch/memchr-sse2.S: Likewise. * sysdeps/i386/i686/multiarch/memchr.S: Likewise. * sysdeps/i386/i686/multiarch/memcmp-sse4.S: Likewise. * sysdeps/i386/i686/multiarch/memcmp-ssse3.S: Likewise. * sysdeps/i386/i686/multiarch/memcmp.S: Likewise. * sysdeps/i386/i686/multiarch/memcpy-ssse3-rep.S: Likewise. * sysdeps/i386/i686/multiarch/memcpy-ssse3.S: Likewise. * sysdeps/i386/i686/multiarch/memcpy.S: Likewise. * sysdeps/i386/i686/multiarch/memcpy_chk.S: Likewise. * sysdeps/i386/i686/multiarch/memmove.S: Likewise. * sysdeps/i386/i686/multiarch/memmove_chk.S: Likewise. * sysdeps/i386/i686/multiarch/mempcpy.S: Likewise. * sysdeps/i386/i686/multiarch/mempcpy_chk.S: Likewise. * sysdeps/i386/i686/multiarch/memrchr-c.c: Likewise. * sysdeps/i386/i686/multiarch/memrchr-sse2-bsf.S: Likewise. * sysdeps/i386/i686/multiarch/memrchr-sse2.S: Likewise. * sysdeps/i386/i686/multiarch/memrchr.S: Likewise. * sysdeps/i386/i686/multiarch/memset-sse2-rep.S: Likewise. * sysdeps/i386/i686/multiarch/memset-sse2.S: Likewise. * sysdeps/i386/i686/multiarch/memset.S: Likewise. * sysdeps/i386/i686/multiarch/memset_chk.S: Likewise. * sysdeps/i386/i686/multiarch/rawmemchr.S: Likewise. * sysdeps/i386/i686/multiarch/strcat-sse2.S: Likewise. * sysdeps/i386/i686/multiarch/strcat-ssse3.S: Likewise. * sysdeps/i386/i686/multiarch/strcat.S: Likewise. * sysdeps/i386/i686/multiarch/strchr-sse2-bsf.S: Likewise. * sysdeps/i386/i686/multiarch/strchr-sse2.S: Likewise. * sysdeps/i386/i686/multiarch/strchr.S: Likewise. * sysdeps/i386/i686/multiarch/strcmp-sse4.S: Likewise. * sysdeps/i386/i686/multiarch/strcmp-ssse3.S: Likewise. * sysdeps/i386/i686/multiarch/strcmp.S: Likewise. * sysdeps/i386/i686/multiarch/strcpy-sse2.S: Likewise. * sysdeps/i386/i686/multiarch/strcpy-ssse3.S: Likewise. * sysdeps/i386/i686/multiarch/strcpy.S: Likewise. * sysdeps/i386/i686/multiarch/strcspn.S: Likewise. * sysdeps/i386/i686/multiarch/strlen-sse2-bsf.S: Likewise. * sysdeps/i386/i686/multiarch/strlen-sse2.S: Likewise. * sysdeps/i386/i686/multiarch/strlen.S: Likewise. * sysdeps/i386/i686/multiarch/strnlen.S: Likewise. * sysdeps/i386/i686/multiarch/strrchr-sse2-bsf.S: Likewise. * sysdeps/i386/i686/multiarch/strrchr-sse2.S: Likewise. * sysdeps/i386/i686/multiarch/strrchr.S: Likewise. * sysdeps/i386/i686/multiarch/strspn.S: Likewise. * sysdeps/i386/i686/multiarch/wcschr-c.c: Likewise. * sysdeps/i386/i686/multiarch/wcschr-sse2.S: Likewise. * sysdeps/i386/i686/multiarch/wcschr.S: Likewise. * sysdeps/i386/i686/multiarch/wcscmp-sse2.S: Likewise. * sysdeps/i386/i686/multiarch/wcscmp.S: Likewise. * sysdeps/i386/i686/multiarch/wcscpy-c.c: Likewise. * sysdeps/i386/i686/multiarch/wcscpy-ssse3.S: Likewise. * sysdeps/i386/i686/multiarch/wcscpy.S: Likewise. * sysdeps/i386/i686/multiarch/wcslen-c.c: Likewise. * sysdeps/i386/i686/multiarch/wcslen-sse2.S: Likewise. * sysdeps/i386/i686/multiarch/wcslen.S: Likewise. * sysdeps/i386/i686/multiarch/wcsrchr-c.c: Likewise. * sysdeps/i386/i686/multiarch/wcsrchr-sse2.S: Likewise. * sysdeps/i386/i686/multiarch/wcsrchr.S: Likewise. * sysdeps/i386/i686/multiarch/wmemcmp-c.c: Likewise. * sysdeps/i386/i686/multiarch/wmemcmp.S: Likewise. * sysdeps/ia64/fpu/libm-symbols.h: Likewise. * sysdeps/nptl/bits/libc-lock.h: Likewise. * sysdeps/nptl/bits/libc-lockP.h: Likewise. * sysdeps/nptl/bits/stdio-lock.h: Likewise. * sysdeps/posix/closedir.c: Likewise. * sysdeps/posix/opendir.c: Likewise. * sysdeps/posix/readdir.c: Likewise. * sysdeps/posix/rewinddir.c: Likewise. * sysdeps/powerpc/novmx-sigjmp.c: Likewise. * sysdeps/powerpc/powerpc32/__longjmp.S: Likewise. * sysdeps/powerpc/powerpc32/bsd-_setjmp.S: Likewise. * sysdeps/powerpc/powerpc32/fpu/__longjmp.S: Likewise. * sysdeps/powerpc/powerpc32/fpu/setjmp.S: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/bzero.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/memchr.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/memcmp-ppc32.S: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/memcmp.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/memcpy-ppc32.S: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/memcpy.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/memmove.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/mempcpy.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/memrchr-ppc32.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/memrchr.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/memset-ppc32.S: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/memset.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/rawmemchr.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/strcasecmp.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/strcasecmp_l.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/strchr.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/strchrnul.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/strlen-ppc32.S: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/strlen.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/strncase.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/strncase_l.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/strncmp-ppc32.S: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/strncmp.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/strnlen.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/wcschr-ppc32.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/wcschr.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/wcscpy-ppc32.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/wcscpy.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/wcsrchr-ppc32.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/wcsrchr.c: Likewise. * sysdeps/powerpc/powerpc32/power4/multiarch/wordcopy.c: Likewise. * sysdeps/powerpc/powerpc32/power6/memset.S: Likewise. * sysdeps/powerpc/powerpc32/setjmp.S: Likewise. * sysdeps/powerpc/powerpc64/__longjmp.S: Likewise. * sysdeps/powerpc/powerpc64/multiarch/bzero.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/memchr.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/memcmp-ppc64.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/memcmp.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/memcpy-ppc64.S: Likewise. * sysdeps/powerpc/powerpc64/multiarch/memcpy.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/memmove-ppc64.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/memmove.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/mempcpy.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/memrchr.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/memset-ppc64.S: Likewise. * sysdeps/powerpc/powerpc64/multiarch/memset.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/rawmemchr.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/stpcpy-ppc64.S: Likewise. * sysdeps/powerpc/powerpc64/multiarch/stpcpy.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/stpncpy.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strcasecmp.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strcasecmp_l.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strcat.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strchr.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strchrnul.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strcmp-ppc64.S: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strcmp.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strcpy-ppc64.S: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strcpy.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strcspn.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strlen-ppc64.S: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strlen.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strncase.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strncase_l.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strncat.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strncmp-ppc64.S: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strncmp.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strncpy-ppc64.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strncpy.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strnlen.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strpbrk.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strrchr-ppc64.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strrchr.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strspn-ppc64.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/strspn.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/wcschr.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/wcscpy.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/wcsrchr.c: Likewise. * sysdeps/powerpc/powerpc64/multiarch/wordcopy.c: Likewise. * sysdeps/powerpc/powerpc64/setjmp.S: Likewise. * sysdeps/s390/s390-32/multiarch/ifunc-resolve.c: Likewise. * sysdeps/s390/s390-32/multiarch/memcmp.S: Likewise. * sysdeps/s390/s390-32/multiarch/memcpy.S: Likewise. * sysdeps/s390/s390-32/multiarch/memset.S: Likewise. * sysdeps/s390/s390-64/multiarch/ifunc-resolve.c: Likewise. * sysdeps/s390/s390-64/multiarch/memcmp.S: Likewise. * sysdeps/s390/s390-64/multiarch/memcpy.S: Likewise. * sysdeps/s390/s390-64/multiarch/memset.S: Likewise. * sysdeps/sparc/sparc64/multiarch/memcpy-niagara1.S: Likewise. * sysdeps/sparc/sparc64/multiarch/memcpy-niagara2.S: Likewise. * sysdeps/sparc/sparc64/multiarch/memcpy-niagara4.S: Likewise. * sysdeps/sparc/sparc64/multiarch/memcpy-ultra3.S: Likewise. * sysdeps/sparc/sparc64/multiarch/memcpy.S: Likewise. * sysdeps/sparc/sparc64/multiarch/memset-niagara1.S: Likewise. * sysdeps/sparc/sparc64/multiarch/memset-niagara4.S: Likewise. * sysdeps/sparc/sparc64/multiarch/memset.S: Likewise. * sysdeps/unix/alpha/sysdep.S: Likewise. * sysdeps/unix/alpha/sysdep.h: Likewise. * sysdeps/unix/make-syscalls.sh: Likewise. * sysdeps/unix/sysv/linux/aarch64/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/aarch64/sysdep.h: Likewise. * sysdeps/unix/sysv/linux/alpha/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/alpha/vfork.S: Likewise. * sysdeps/unix/sysv/linux/arm/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/arm/sysdep.h: Likewise. * sysdeps/unix/sysv/linux/getpid.c: Likewise. * sysdeps/unix/sysv/linux/hppa/nptl/lowlevellock.h: Likewise. * sysdeps/unix/sysv/linux/hppa/nptl/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/i386/i486/lowlevellock.S: Likewise. * sysdeps/unix/sysv/linux/i386/lowlevellock.h: Likewise. * sysdeps/unix/sysv/linux/i386/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/i386/sysdep.h: Likewise. * sysdeps/unix/sysv/linux/ia64/lowlevellock.h: Likewise. * sysdeps/unix/sysv/linux/ia64/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/ia64/sysdep.S: Likewise. * sysdeps/unix/sysv/linux/ia64/sysdep.h: Likewise. * sysdeps/unix/sysv/linux/lowlevellock-futex.h: Likewise. * sysdeps/unix/sysv/linux/m68k/bits/m68k-vdso.h: Likewise. * sysdeps/unix/sysv/linux/m68k/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/m68k/sysdep.h: Likewise. * sysdeps/unix/sysv/linux/microblaze/lowlevellock.h: Likewise. * sysdeps/unix/sysv/linux/microblaze/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/mips/mips64/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/mips/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/not-cancel.h: Likewise. * sysdeps/unix/sysv/linux/powerpc/lowlevellock.h: Likewise. * sysdeps/unix/sysv/linux/powerpc/powerpc32/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/powerpc/powerpc64/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/s390/longjmp_chk.c: Likewise. * sysdeps/unix/sysv/linux/s390/lowlevellock.h: Likewise. * sysdeps/unix/sysv/linux/s390/s390-32/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/s390/s390-32/sysdep.S: Likewise. * sysdeps/unix/sysv/linux/s390/s390-32/sysdep.h: Likewise. * sysdeps/unix/sysv/linux/s390/s390-32/vfork.S: Likewise. * sysdeps/unix/sysv/linux/s390/s390-64/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/s390/s390-64/sysdep.S: Likewise. * sysdeps/unix/sysv/linux/s390/s390-64/sysdep.h: Likewise. * sysdeps/unix/sysv/linux/s390/s390-64/vfork.S: Likewise. * sysdeps/unix/sysv/linux/sh/lowlevellock.S: Likewise. * sysdeps/unix/sysv/linux/sh/lowlevellock.h: Likewise. * sysdeps/unix/sysv/linux/sh/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/sh/sysdep.h: Likewise. * sysdeps/unix/sysv/linux/sh/vfork.S: Likewise. * sysdeps/unix/sysv/linux/sparc/lowlevellock.h: Likewise. * sysdeps/unix/sysv/linux/sparc/sparc32/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/sparc/sparc32/sysdep.h: Likewise. * sysdeps/unix/sysv/linux/sparc/sparc64/brk.S: Likewise. * sysdeps/unix/sysv/linux/sparc/sparc64/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/sparc/sparc64/sysdep.h: Likewise. * sysdeps/unix/sysv/linux/tile/lowlevellock.h: Likewise. * sysdeps/unix/sysv/linux/tile/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/tile/sysdep.h: Likewise. * sysdeps/unix/sysv/linux/tile/waitpid.S: Likewise. * sysdeps/unix/sysv/linux/x86_64/lowlevellock.S: Likewise. * sysdeps/unix/sysv/linux/x86_64/lowlevellock.h: Likewise. * sysdeps/unix/sysv/linux/x86_64/sysdep-cancel.h: Likewise. * sysdeps/unix/sysv/linux/x86_64/sysdep.h: Likewise. * sysdeps/wordsize-32/symbol-hacks.h: Likewise. * sysdeps/x86_64/memcpy.S: Likewise. * sysdeps/x86_64/memmove.c: Likewise. * sysdeps/x86_64/memset.S: Likewise. * sysdeps/x86_64/multiarch/init-arch.h: Likewise. * sysdeps/x86_64/multiarch/memcmp-sse4.S: Likewise. * sysdeps/x86_64/multiarch/memcmp-ssse3.S: Likewise. * sysdeps/x86_64/multiarch/memcmp.S: Likewise. * sysdeps/x86_64/multiarch/memcpy-avx-unaligned.S: Likewise. * sysdeps/x86_64/multiarch/memcpy-ssse3-back.S: Likewise. * sysdeps/x86_64/multiarch/memcpy-ssse3.S: Likewise. * sysdeps/x86_64/multiarch/memcpy.S: Likewise. * sysdeps/x86_64/multiarch/memcpy_chk.S: Likewise. * sysdeps/x86_64/multiarch/memmove.c: Likewise. * sysdeps/x86_64/multiarch/mempcpy.S: Likewise. * sysdeps/x86_64/multiarch/mempcpy_chk.S: Likewise. * sysdeps/x86_64/multiarch/memset-avx2.S: Likewise. * sysdeps/x86_64/multiarch/memset.S: Likewise. * sysdeps/x86_64/multiarch/memset_chk.S: Likewise. * sysdeps/x86_64/multiarch/strcat-sse2-unaligned.S: Likewise. * sysdeps/x86_64/multiarch/strcat-ssse3.S: Likewise. * sysdeps/x86_64/multiarch/strcat.S: Likewise. * sysdeps/x86_64/multiarch/strchr-sse2-no-bsf.S: Likewise. * sysdeps/x86_64/multiarch/strchr.S: Likewise. * sysdeps/x86_64/multiarch/strcmp-ssse3.S: Likewise. * sysdeps/x86_64/multiarch/strcmp.S: Likewise. * sysdeps/x86_64/multiarch/strcpy-sse2-unaligned.S: Likewise. * sysdeps/x86_64/multiarch/strcpy-ssse3.S: Likewise. * sysdeps/x86_64/multiarch/strcpy.S: Likewise. * sysdeps/x86_64/multiarch/strcspn.S: Likewise. * sysdeps/x86_64/multiarch/strspn.S: Likewise. * sysdeps/x86_64/multiarch/wcscpy-c.c: Likewise. * sysdeps/x86_64/multiarch/wcscpy-ssse3.S: Likewise. * sysdeps/x86_64/multiarch/wcscpy.S: Likewise. * sysdeps/x86_64/multiarch/wmemcmp-c.c: Likewise. * sysdeps/x86_64/multiarch/wmemcmp.S: Likewise. * sysdeps/x86_64/strcmp.S: Likewise.
2014-11-24 15:03:45 +05:30
#if IS_IN (libc)
2011-09-05 13:53:27 -04:00
# include <sysdep.h>
# define CFI_PUSH(REG) \
cfi_adjust_cfa_offset (4); \
cfi_rel_offset (REG, 0)
# define CFI_POP(REG) \
cfi_adjust_cfa_offset (-4); \
cfi_restore (REG)
# define PUSH(REG) pushl REG; CFI_PUSH (REG)
# define POP(REG) popl REG; CFI_POP (REG)
# define ENTRANCE PUSH(%esi); PUSH(%edi)
# define RETURN POP(%edi); POP(%esi); ret; CFI_PUSH(%esi); CFI_PUSH(%edi);
# define PARMS 4
# define STR1 PARMS
# define STR2 STR1+4
2011-10-23 13:34:15 -04:00
/* Note: wcscmp uses signed comparison, not unsugned as in strcmp function. */
2011-09-05 13:53:27 -04:00
.text
2011-10-23 13:34:15 -04:00
ENTRY (__wcscmp_sse2)
2011-09-05 13:53:27 -04:00
/*
* This implementation uses SSE to compare up to 16 bytes at a time.
*/
mov STR1(%esp), %edx
mov STR2(%esp), %eax
mov (%eax), %ecx
cmp %ecx, (%edx)
jne L(neq)
test %ecx, %ecx
jz L(eq)
mov 4(%eax), %ecx
cmp %ecx, 4(%edx)
jne L(neq)
test %ecx, %ecx
jz L(eq)
mov 8(%eax), %ecx
cmp %ecx, 8(%edx)
jne L(neq)
test %ecx, %ecx
jz L(eq)
mov 12(%eax), %ecx
cmp %ecx, 12(%edx)
jne L(neq)
test %ecx, %ecx
jz L(eq)
ENTRANCE
add $16, %eax
add $16, %edx
mov %eax, %esi
mov %edx, %edi
pxor %xmm0, %xmm0 /* clear %xmm0 for null char checks */
mov %al, %ch
mov %dl, %cl
and $63, %eax /* esi alignment in cache line */
and $63, %edx /* edi alignment in cache line */
and $15, %cl
jz L(continue_00)
cmp $16, %edx
jb L(continue_0)
cmp $32, %edx
jb L(continue_16)
cmp $48, %edx
jb L(continue_32)
L(continue_48):
and $15, %ch
jz L(continue_48_00)
cmp $16, %eax
jb L(continue_0_48)
cmp $32, %eax
jb L(continue_16_48)
cmp $48, %eax
jb L(continue_32_48)
.p2align 4
L(continue_48_48):
mov (%esi), %ecx
cmp %ecx, (%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 4(%esi), %ecx
cmp %ecx, 4(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 8(%esi), %ecx
cmp %ecx, 8(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 12(%esi), %ecx
cmp %ecx, 12(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
2011-10-23 13:35:24 -04:00
2011-09-05 13:53:27 -04:00
movdqu 16(%edi), %xmm1
movdqu 16(%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
movdqu 32(%edi), %xmm1
movdqu 32(%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_32)
movdqu 48(%edi), %xmm1
movdqu 48(%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_48)
add $64, %esi
add $64, %edi
jmp L(continue_48_48)
L(continue_0):
and $15, %ch
jz L(continue_0_00)
cmp $16, %eax
jb L(continue_0_0)
cmp $32, %eax
jb L(continue_0_16)
cmp $48, %eax
jb L(continue_0_32)
.p2align 4
L(continue_0_48):
mov (%esi), %ecx
cmp %ecx, (%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 4(%esi), %ecx
cmp %ecx, 4(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 8(%esi), %ecx
cmp %ecx, 8(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 12(%esi), %ecx
cmp %ecx, 12(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
movdqu 16(%edi), %xmm1
movdqu 16(%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
movdqu 32(%edi), %xmm1
movdqu 32(%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_32)
mov 48(%esi), %ecx
cmp %ecx, 48(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 52(%esi), %ecx
cmp %ecx, 52(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 56(%esi), %ecx
cmp %ecx, 56(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 60(%esi), %ecx
cmp %ecx, 60(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
add $64, %esi
add $64, %edi
jmp L(continue_0_48)
.p2align 4
L(continue_00):
and $15, %ch
jz L(continue_00_00)
cmp $16, %eax
jb L(continue_00_0)
cmp $32, %eax
jb L(continue_00_16)
cmp $48, %eax
jb L(continue_00_32)
.p2align 4
L(continue_00_48):
pcmpeqd (%edi), %xmm0
mov (%edi), %eax
pmovmskb %xmm0, %ecx
test %ecx, %ecx
jnz L(less4_double_words1)
2011-10-23 13:34:15 -04:00
cmp (%esi), %eax
jne L(nequal)
2011-10-23 13:35:24 -04:00
2011-09-05 13:53:27 -04:00
mov 4(%edi), %eax
2011-10-23 13:34:15 -04:00
cmp 4(%esi), %eax
jne L(nequal)
2011-09-05 13:53:27 -04:00
mov 8(%edi), %eax
2011-10-23 13:34:15 -04:00
cmp 8(%esi), %eax
jne L(nequal)
2011-09-05 13:53:27 -04:00
mov 12(%edi), %eax
2011-10-23 13:34:15 -04:00
cmp 12(%esi), %eax
jne L(nequal)
2011-10-23 13:35:24 -04:00
2011-09-05 13:53:27 -04:00
movdqu 16(%esi), %xmm2
pcmpeqd %xmm2, %xmm0 /* Any null double_word? */
pcmpeqd 16(%edi), %xmm2 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm2 /* packed sub of comparison results*/
pmovmskb %xmm2, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
movdqu 32(%esi), %xmm2
pcmpeqd %xmm2, %xmm0 /* Any null double_word? */
pcmpeqd 32(%edi), %xmm2 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm2 /* packed sub of comparison results*/
pmovmskb %xmm2, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_32)
movdqu 48(%esi), %xmm2
pcmpeqd %xmm2, %xmm0 /* Any null double_word? */
pcmpeqd 48(%edi), %xmm2 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm2 /* packed sub of comparison results*/
pmovmskb %xmm2, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_48)
add $64, %esi
add $64, %edi
jmp L(continue_00_48)
.p2align 4
L(continue_32):
and $15, %ch
jz L(continue_32_00)
cmp $16, %eax
jb L(continue_0_32)
cmp $32, %eax
jb L(continue_16_32)
cmp $48, %eax
jb L(continue_32_32)
.p2align 4
L(continue_32_48):
mov (%esi), %ecx
cmp %ecx, (%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 4(%esi), %ecx
cmp %ecx, 4(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 8(%esi), %ecx
cmp %ecx, 8(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 12(%esi), %ecx
cmp %ecx, 12(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 16(%esi), %ecx
cmp %ecx, 16(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 20(%esi), %ecx
cmp %ecx, 20(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 24(%esi), %ecx
cmp %ecx, 24(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 28(%esi), %ecx
cmp %ecx, 28(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
movdqu 32(%edi), %xmm1
movdqu 32(%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_32)
movdqu 48(%edi), %xmm1
movdqu 48(%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
2011-10-23 13:34:15 -04:00
psubb %xmm0, %xmm1 /* packed sub of comparison results */
2011-09-05 13:53:27 -04:00
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_48)
add $64, %esi
add $64, %edi
jmp L(continue_32_48)
.p2align 4
L(continue_16):
and $15, %ch
jz L(continue_16_00)
cmp $16, %eax
jb L(continue_0_16)
cmp $32, %eax
jb L(continue_16_16)
cmp $48, %eax
jb L(continue_16_32)
.p2align 4
L(continue_16_48):
mov (%esi), %ecx
cmp %ecx, (%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 4(%esi), %ecx
cmp %ecx, 4(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 8(%esi), %ecx
cmp %ecx, 8(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 12(%esi), %ecx
cmp %ecx, 12(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
movdqu 16(%edi), %xmm1
movdqu 16(%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
mov 32(%esi), %ecx
cmp %ecx, 32(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 36(%esi), %ecx
cmp %ecx, 36(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 40(%esi), %ecx
cmp %ecx, 40(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 44(%esi), %ecx
cmp %ecx, 44(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
movdqu 48(%edi), %xmm1
movdqu 48(%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_48)
add $64, %esi
add $64, %edi
jmp L(continue_16_48)
.p2align 4
L(continue_00_00):
movdqa (%edi), %xmm1
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd (%esi), %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
movdqa 16(%edi), %xmm3
pcmpeqd %xmm3, %xmm0 /* Any null double_word? */
pcmpeqd 16(%esi), %xmm3 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm3 /* packed sub of comparison results*/
pmovmskb %xmm3, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
movdqa 32(%edi), %xmm5
pcmpeqd %xmm5, %xmm0 /* Any null double_word? */
pcmpeqd 32(%esi), %xmm5 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm5 /* packed sub of comparison results*/
pmovmskb %xmm5, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_32)
movdqa 48(%edi), %xmm1
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd 48(%esi), %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_48)
add $64, %esi
add $64, %edi
jmp L(continue_00_00)
.p2align 4
L(continue_00_32):
movdqu (%esi), %xmm2
pcmpeqd %xmm2, %xmm0 /* Any null double_word? */
pcmpeqd (%edi), %xmm2 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm2 /* packed sub of comparison results*/
pmovmskb %xmm2, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
add $16, %esi
add $16, %edi
jmp L(continue_00_48)
.p2align 4
L(continue_00_16):
movdqu (%esi), %xmm2
pcmpeqd %xmm2, %xmm0 /* Any null double_word? */
pcmpeqd (%edi), %xmm2 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm2 /* packed sub of comparison results*/
pmovmskb %xmm2, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
movdqu 16(%esi), %xmm2
pcmpeqd %xmm2, %xmm0 /* Any null double_word? */
pcmpeqd 16(%edi), %xmm2 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm2 /* packed sub of comparison results*/
pmovmskb %xmm2, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
add $32, %esi
add $32, %edi
jmp L(continue_00_48)
.p2align 4
L(continue_00_0):
movdqu (%esi), %xmm2
pcmpeqd %xmm2, %xmm0 /* Any null double_word? */
pcmpeqd (%edi), %xmm2 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm2 /* packed sub of comparison results*/
pmovmskb %xmm2, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
movdqu 16(%esi), %xmm2
pcmpeqd %xmm2, %xmm0 /* Any null double_word? */
pcmpeqd 16(%edi), %xmm2 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm2 /* packed sub of comparison results*/
pmovmskb %xmm2, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
movdqu 32(%esi), %xmm2
pcmpeqd %xmm2, %xmm0 /* Any null double_word? */
pcmpeqd 32(%edi), %xmm2 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm2 /* packed sub of comparison results*/
pmovmskb %xmm2, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_32)
add $48, %esi
add $48, %edi
jmp L(continue_00_48)
.p2align 4
L(continue_48_00):
pcmpeqd (%esi), %xmm0
mov (%edi), %eax
pmovmskb %xmm0, %ecx
test %ecx, %ecx
jnz L(less4_double_words1)
2011-10-23 13:34:15 -04:00
cmp (%esi), %eax
jne L(nequal)
2011-10-23 13:35:24 -04:00
2011-09-05 13:53:27 -04:00
mov 4(%edi), %eax
2011-10-23 13:34:15 -04:00
cmp 4(%esi), %eax
jne L(nequal)
2011-09-05 13:53:27 -04:00
mov 8(%edi), %eax
2011-10-23 13:34:15 -04:00
cmp 8(%esi), %eax
jne L(nequal)
2011-09-05 13:53:27 -04:00
mov 12(%edi), %eax
2011-10-23 13:34:15 -04:00
cmp 12(%esi), %eax
jne L(nequal)
2011-10-23 13:35:24 -04:00
2011-09-05 13:53:27 -04:00
movdqu 16(%edi), %xmm1
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd 16(%esi), %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
movdqu 32(%edi), %xmm1
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd 32(%esi), %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_32)
movdqu 48(%edi), %xmm1
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd 48(%esi), %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_48)
add $64, %esi
add $64, %edi
jmp L(continue_48_00)
.p2align 4
L(continue_32_00):
movdqu (%edi), %xmm1
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd (%esi), %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
add $16, %esi
add $16, %edi
jmp L(continue_48_00)
.p2align 4
L(continue_16_00):
movdqu (%edi), %xmm1
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd (%esi), %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
movdqu 16(%edi), %xmm1
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd 16(%esi), %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
add $32, %esi
add $32, %edi
jmp L(continue_48_00)
.p2align 4
L(continue_0_00):
movdqu (%edi), %xmm1
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd (%esi), %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
movdqu 16(%edi), %xmm1
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd 16(%esi), %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
movdqu 32(%edi), %xmm1
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd 32(%esi), %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_32)
add $48, %esi
add $48, %edi
jmp L(continue_48_00)
.p2align 4
L(continue_32_32):
movdqu (%edi), %xmm1
movdqu (%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
add $16, %esi
add $16, %edi
jmp L(continue_48_48)
.p2align 4
L(continue_16_16):
movdqu (%edi), %xmm1
movdqu (%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
movdqu 16(%edi), %xmm3
movdqu 16(%esi), %xmm4
pcmpeqd %xmm3, %xmm0 /* Any null double_word? */
pcmpeqd %xmm4, %xmm3 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm3 /* packed sub of comparison results*/
pmovmskb %xmm3, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
add $32, %esi
add $32, %edi
jmp L(continue_48_48)
.p2align 4
L(continue_0_0):
movdqu (%edi), %xmm1
movdqu (%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
movdqu 16(%edi), %xmm3
movdqu 16(%esi), %xmm4
pcmpeqd %xmm3, %xmm0 /* Any null double_word? */
pcmpeqd %xmm4, %xmm3 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm3 /* packed sub of comparison results*/
pmovmskb %xmm3, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
movdqu 32(%edi), %xmm1
movdqu 32(%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_32)
add $48, %esi
add $48, %edi
jmp L(continue_48_48)
.p2align 4
L(continue_0_16):
movdqu (%edi), %xmm1
movdqu (%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
movdqu 16(%edi), %xmm1
movdqu 16(%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words_16)
add $32, %esi
add $32, %edi
jmp L(continue_32_48)
.p2align 4
L(continue_0_32):
movdqu (%edi), %xmm1
movdqu (%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
add $16, %esi
add $16, %edi
jmp L(continue_16_48)
.p2align 4
L(continue_16_32):
movdqu (%edi), %xmm1
movdqu (%esi), %xmm2
pcmpeqd %xmm1, %xmm0 /* Any null double_word? */
pcmpeqd %xmm2, %xmm1 /* compare first 4 double_words for equality */
psubb %xmm0, %xmm1 /* packed sub of comparison results*/
pmovmskb %xmm1, %edx
sub $0xffff, %edx /* if first 4 double_words are same, edx == 0xffff */
jnz L(less4_double_words)
add $16, %esi
add $16, %edi
jmp L(continue_32_48)
.p2align 4
L(less4_double_words1):
cmp (%esi), %eax
jne L(nequal)
test %eax, %eax
jz L(equal)
mov 4(%esi), %ecx
cmp %ecx, 4(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
mov 8(%esi), %ecx
cmp %ecx, 8(%edi)
jne L(nequal)
test %ecx, %ecx
jz L(equal)
2011-10-23 13:34:15 -04:00
mov 12(%esi), %ecx
cmp %ecx, 12(%edi)
jne L(nequal)
xor %eax, %eax
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(less4_double_words):
2011-10-23 13:34:15 -04:00
xor %eax, %eax
2011-09-05 13:53:27 -04:00
test %dl, %dl
jz L(next_two_double_words)
and $15, %dl
jz L(second_double_word)
2011-10-23 13:34:15 -04:00
mov (%esi), %ecx
cmp %ecx, (%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(second_double_word):
2011-10-23 13:34:15 -04:00
mov 4(%esi), %ecx
cmp %ecx, 4(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(next_two_double_words):
and $15, %dh
jz L(fourth_double_word)
2011-10-23 13:34:15 -04:00
mov 8(%esi), %ecx
cmp %ecx, 8(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(fourth_double_word):
2011-10-23 13:34:15 -04:00
mov 12(%esi), %ecx
cmp %ecx, 12(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(less4_double_words_16):
2011-10-23 13:34:15 -04:00
xor %eax, %eax
2011-09-05 13:53:27 -04:00
test %dl, %dl
jz L(next_two_double_words_16)
and $15, %dl
jz L(second_double_word_16)
2011-10-23 13:34:15 -04:00
mov 16(%esi), %ecx
cmp %ecx, 16(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(second_double_word_16):
2011-10-23 13:34:15 -04:00
mov 20(%esi), %ecx
cmp %ecx, 20(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(next_two_double_words_16):
and $15, %dh
jz L(fourth_double_word_16)
2011-10-23 13:34:15 -04:00
mov 24(%esi), %ecx
cmp %ecx, 24(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(fourth_double_word_16):
2011-10-23 13:34:15 -04:00
mov 28(%esi), %ecx
cmp %ecx, 28(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(less4_double_words_32):
2011-10-23 13:34:15 -04:00
xor %eax, %eax
2011-09-05 13:53:27 -04:00
test %dl, %dl
jz L(next_two_double_words_32)
and $15, %dl
jz L(second_double_word_32)
2011-10-23 13:34:15 -04:00
mov 32(%esi), %ecx
cmp %ecx, 32(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(second_double_word_32):
2011-10-23 13:34:15 -04:00
mov 36(%esi), %ecx
cmp %ecx, 36(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(next_two_double_words_32):
and $15, %dh
jz L(fourth_double_word_32)
2011-10-23 13:34:15 -04:00
mov 40(%esi), %ecx
cmp %ecx, 40(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(fourth_double_word_32):
2011-10-23 13:34:15 -04:00
mov 44(%esi), %ecx
cmp %ecx, 44(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(less4_double_words_48):
2011-10-23 13:34:15 -04:00
xor %eax, %eax
2011-09-05 13:53:27 -04:00
test %dl, %dl
jz L(next_two_double_words_48)
and $15, %dl
jz L(second_double_word_48)
2011-10-23 13:34:15 -04:00
mov 48(%esi), %ecx
cmp %ecx, 48(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(second_double_word_48):
2011-10-23 13:34:15 -04:00
mov 52(%esi), %ecx
cmp %ecx, 52(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(next_two_double_words_48):
and $15, %dh
jz L(fourth_double_word_48)
2011-10-23 13:34:15 -04:00
mov 56(%esi), %ecx
cmp %ecx, 56(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(fourth_double_word_48):
2011-10-23 13:34:15 -04:00
mov 60(%esi), %ecx
cmp %ecx, 60(%edi)
jne L(nequal)
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(nequal):
mov $1, %eax
2011-10-23 13:34:15 -04:00
jg L(return)
2011-09-05 13:53:27 -04:00
neg %eax
2011-10-23 13:34:15 -04:00
RETURN
2011-09-05 13:53:27 -04:00
2011-10-23 13:34:15 -04:00
.p2align 4
L(return):
2011-09-05 13:53:27 -04:00
RETURN
.p2align 4
L(equal):
xorl %eax, %eax
RETURN
CFI_POP (%edi)
CFI_POP (%esi)
.p2align 4
L(neq):
mov $1, %eax
2011-10-23 13:34:15 -04:00
jg L(neq_bigger)
2011-09-05 13:53:27 -04:00
neg %eax
L(neq_bigger):
ret
.p2align 4
L(eq):
xorl %eax, %eax
ret
2011-10-23 13:34:15 -04:00
END (__wcscmp_sse2)
2011-09-05 13:53:27 -04:00
#endif