96d6fd6c40
This patch adds an optimized POWER8 strcpy using unaligned accesses. For strings up to 16 bytes, the implementation first calculates the string size, like strlen, and issues a memcpy. For larger strings, the source is first aligned to 16 bytes and then tested in a loop that reads 16 bytes and combines the cmpb results for speedup. A special case is added for page-crossing reads. It shows a 30%-60% improvement over the optimized POWER7 one, which uses only aligned accesses.
35 lines
1.3 KiB
C
35 lines
1.3 KiB
C
/* Multiple versions of strcpy. PowerPC64 version.
|
|
Copyright (C) 2013-2015 Free Software Foundation, Inc.
|
|
This file is part of the GNU C Library.
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
modify it under the terms of the GNU Lesser General Public
|
|
License as published by the Free Software Foundation; either
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Lesser General Public License for more details.
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
License along with the GNU C Library; if not, see
|
|
<http://www.gnu.org/licenses/>. */
|
|
|
|
#if defined SHARED && IS_IN (libc)
|
|
# include <string.h>
|
|
# include <shlib-compat.h>
|
|
# include "init-arch.h"
|
|
|
|
/* Candidate strcpy implementations that the libc_ifunc selector in this
   file chooses between.  Each one is declared with exactly the type of
   strcpy (via __typeof) and tagged attribute_hidden.  They are only
   declared here; no definition appears in the visible part of this file.
   NOTE(review): attribute_hidden is not defined in this file; presumably
   it gives the symbols hidden visibility -- confirm in the glibc headers.  */
/* Used when neither feature test in the selector matches.  */
extern __typeof (strcpy) __strcpy_ppc attribute_hidden;
|
|
/* Used when hwcap has PPC_FEATURE_HAS_VSX set and the power8 test failed.  */
extern __typeof (strcpy) __strcpy_power7 attribute_hidden;
|
|
/* Used when hwcap2 has PPC_FEATURE2_ARCH_2_07 set.  */
extern __typeof (strcpy) __strcpy_power8 attribute_hidden;
|
|
|
|
/* Define strcpy through libc_ifunc, picking one of the three candidate
   implementations from the hwcap / hwcap2 feature words.  The tests are
   evaluated in this order:
     1. hwcap2 has PPC_FEATURE2_ARCH_2_07 set -> __strcpy_power8
     2. hwcap has PPC_FEATURE_HAS_VSX set     -> __strcpy_power7
     3. otherwise                             -> __strcpy_ppc
   The nested conditional relies on ?: being right-associative, so the
   VSX test is only reached when the ARCH_2_07 test fails.
   NOTE(review): libc_ifunc, hwcap and hwcap2 are not defined in this
   file; presumably they are provided by "init-arch.h" -- confirm there
   when changing the selection logic.  */
libc_ifunc (strcpy,
|
|
(hwcap2 & PPC_FEATURE2_ARCH_2_07)
|
|
? __strcpy_power8 :
|
|
(hwcap & PPC_FEATURE_HAS_VSX)
|
|
? __strcpy_power7
|
|
: __strcpy_ppc);
|
|
#endif
|