2013-12-13 19:31:41 +00:00
|
|
|
/* Enumerate available IFUNC implementations of a function. PowerPC64 version.
|
2023-01-06 21:08:04 +00:00
|
|
|
Copyright (C) 2013-2023 Free Software Foundation, Inc.
|
2013-12-13 19:31:41 +00:00
|
|
|
This file is part of the GNU C Library.
|
|
|
|
|
|
|
|
|
|
The GNU C Library is free software; you can redistribute it and/or
|
|
|
|
|
modify it under the terms of the GNU Lesser General Public
|
|
|
|
|
License as published by the Free Software Foundation; either
|
|
|
|
|
version 2.1 of the License, or (at your option) any later version.
|
|
|
|
|
|
|
|
|
|
The GNU C Library is distributed in the hope that it will be useful,
|
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
|
Lesser General Public License for more details.
|
|
|
|
|
|
|
|
|
|
You should have received a copy of the GNU Lesser General Public
|
|
|
|
|
License along with the GNU C Library; if not, see
|
Prefer https to http for gnu.org and fsf.org URLs
Also, change sources.redhat.com to sourceware.org.
This patch was automatically generated by running the following shell
script, which uses GNU sed, and which avoids modifying files imported
from upstream:
sed -ri '
s,(http|ftp)(://(.*\.)?(gnu|fsf|sourceware)\.org($|[^.]|\.[^a-z])),https\2,g
s,(http|ftp)(://(.*\.)?)sources\.redhat\.com($|[^.]|\.[^a-z]),https\2sourceware.org\4,g
' \
$(find $(git ls-files) -prune -type f \
! -name '*.po' \
! -name 'ChangeLog*' \
! -path COPYING ! -path COPYING.LIB \
! -path manual/fdl-1.3.texi ! -path manual/lgpl-2.1.texi \
! -path manual/texinfo.tex ! -path scripts/config.guess \
! -path scripts/config.sub ! -path scripts/install-sh \
! -path scripts/mkinstalldirs ! -path scripts/move-if-change \
! -path INSTALL ! -path locale/programs/charmap-kw.h \
! -path po/libc.pot ! -path sysdeps/gnu/errlist.c \
! '(' -name configure \
-execdir test -f configure.ac -o -f configure.in ';' ')' \
! '(' -name preconfigure \
-execdir test -f preconfigure.ac ';' ')' \
-print)
and then by running 'make dist-prepare' to regenerate files built
from the altered files, and then executing the following to cleanup:
chmod a+x sysdeps/unix/sysv/linux/riscv/configure
# Omit irrelevant whitespace and comment-only changes,
# perhaps from a slightly-different Autoconf version.
git checkout -f \
sysdeps/csky/configure \
sysdeps/hppa/configure \
sysdeps/riscv/configure \
sysdeps/unix/sysv/linux/csky/configure
# Omit changes that caused a pre-commit check to fail like this:
# remote: *** error: sysdeps/powerpc/powerpc64/ppc-mcount.S: trailing lines
git checkout -f \
sysdeps/powerpc/powerpc64/ppc-mcount.S \
sysdeps/unix/sysv/linux/s390/s390-64/syscall.S
# Omit change that caused a pre-commit check to fail like this:
# remote: *** error: sysdeps/sparc/sparc64/multiarch/memcpy-ultra3.S: last line does not end in newline
git checkout -f sysdeps/sparc/sparc64/multiarch/memcpy-ultra3.S
2019-09-07 05:40:42 +00:00
|
|
|
<https://www.gnu.org/licenses/>. */
|
2013-12-13 19:31:41 +00:00
|
|
|
|
|
|
|
|
#include <assert.h>
|
2023-08-01 12:41:17 +00:00
|
|
|
#include <cpu-features.h>
|
2013-12-13 19:31:41 +00:00
|
|
|
#include <string.h>
|
|
|
|
|
#include <wchar.h>
|
|
|
|
|
#include <ldsodefs.h>
|
|
|
|
|
#include <ifunc-impl-list.h>
|
|
|
|
|
|
|
|
|
|
size_t
|
|
|
|
|
__libc_ifunc_impl_list (const char *name, struct libc_ifunc_impl *array,
|
|
|
|
|
size_t max)
|
|
|
|
|
{
|
2022-06-10 16:13:29 +00:00
|
|
|
size_t i = max;
|
2023-08-01 12:41:17 +00:00
|
|
|
const struct cpu_features *features = &GLRO(dl_powerpc_cpu_features);
|
|
|
|
|
unsigned long int hwcap = features->hwcap;
|
|
|
|
|
unsigned long int hwcap2 = features->hwcap2;
|
2021-07-27 05:47:50 +00:00
|
|
|
#ifdef SHARED
|
|
|
|
|
int cacheline_size = GLRO(dl_cache_line_size);
|
|
|
|
|
#endif
|
2014-07-15 16:19:09 +00:00
|
|
|
|
2013-12-13 19:31:41 +00:00
|
|
|
/* hwcap contains only the latest supported ISA, the code checks which is
|
|
|
|
|
and fills the previous supported ones. */
|
|
|
|
|
if (hwcap & PPC_FEATURE_ARCH_2_06)
|
|
|
|
|
hwcap |= PPC_FEATURE_ARCH_2_05 | PPC_FEATURE_POWER5_PLUS |
|
|
|
|
|
PPC_FEATURE_POWER5 | PPC_FEATURE_POWER4;
|
|
|
|
|
else if (hwcap & PPC_FEATURE_ARCH_2_05)
|
|
|
|
|
hwcap |= PPC_FEATURE_POWER5_PLUS | PPC_FEATURE_POWER5 | PPC_FEATURE_POWER4;
|
|
|
|
|
else if (hwcap & PPC_FEATURE_POWER5_PLUS)
|
|
|
|
|
hwcap |= PPC_FEATURE_POWER5 | PPC_FEATURE_POWER4;
|
|
|
|
|
else if (hwcap & PPC_FEATURE_POWER5)
|
|
|
|
|
hwcap |= PPC_FEATURE_POWER4;
|
|
|
|
|
|
|
|
|
|
#ifdef SHARED
|
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/memcpy.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, memcpy,
|
2021-04-30 21:12:08 +00:00
|
|
|
#ifdef __LITTLE_ENDIAN__
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memcpy,
|
|
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_3_1
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
|
|
|
|
__memcpy_power10)
|
|
|
|
|
#endif
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memcpy, hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2017-12-11 19:39:42 +00:00
|
|
|
__memcpy_power8_cached)
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memcpy, hwcap & PPC_FEATURE_ARCH_2_06
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2013-12-13 19:31:41 +00:00
|
|
|
__memcpy_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memcpy, hwcap & PPC_FEATURE_ARCH_2_06,
|
|
|
|
|
__memcpy_a2)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memcpy, hwcap & PPC_FEATURE_ARCH_2_05,
|
|
|
|
|
__memcpy_power6)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memcpy, hwcap & PPC_FEATURE_CELL_BE,
|
|
|
|
|
__memcpy_cell)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memcpy, hwcap & PPC_FEATURE_POWER4,
|
|
|
|
|
__memcpy_power4)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memcpy, 1, __memcpy_ppc))
|
2013-12-13 19:33:16 +00:00
|
|
|
|
2014-06-20 17:55:16 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/memmove.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, memmove,
|
2021-04-30 21:12:08 +00:00
|
|
|
#ifdef __LITTLE_ENDIAN__
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memmove,
|
2021-05-03 19:59:35 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_3_1
|
|
|
|
|
&& hwcap2 & PPC_FEATURE2_HAS_ISEL
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2021-04-30 21:12:08 +00:00
|
|
|
__memmove_power10)
|
|
|
|
|
#endif
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memmove, hwcap & PPC_FEATURE_ARCH_2_06
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2014-06-20 17:55:16 +00:00
|
|
|
__memmove_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memmove, 1, __memmove_ppc))
|
|
|
|
|
|
2013-12-13 19:33:16 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/memset.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, memset,
|
2021-04-30 21:12:08 +00:00
|
|
|
#ifdef __LITTLE_ENDIAN__
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memset,
|
2021-05-03 19:59:35 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_3_1
|
|
|
|
|
&& hwcap2 & PPC_FEATURE2_HAS_ISEL
|
2021-07-27 05:47:50 +00:00
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX
|
|
|
|
|
&& cacheline_size == 128,
|
2021-04-30 21:12:08 +00:00
|
|
|
__memset_power10)
|
|
|
|
|
#endif
|
2021-07-27 05:47:50 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memset, hwcap2 & PPC_FEATURE2_ARCH_2_07
|
2021-07-27 05:47:51 +00:00
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC
|
2021-07-27 05:47:50 +00:00
|
|
|
&& cacheline_size == 128,
|
2014-07-15 16:19:09 +00:00
|
|
|
__memset_power8)
|
2021-07-27 05:47:50 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memset, hwcap & PPC_FEATURE_ARCH_2_06
|
|
|
|
|
&& cacheline_size == 128,
|
2013-12-13 19:33:16 +00:00
|
|
|
__memset_power7)
|
2021-07-27 05:47:50 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memset, hwcap & PPC_FEATURE_ARCH_2_05
|
|
|
|
|
&& cacheline_size == 128,
|
2013-12-13 19:33:16 +00:00
|
|
|
__memset_power6)
|
2021-07-27 05:47:50 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memset, hwcap & PPC_FEATURE_POWER4
|
|
|
|
|
&& cacheline_size == 128,
|
2013-12-13 19:33:16 +00:00
|
|
|
__memset_power4)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memset, 1, __memset_ppc))
|
2013-12-13 19:38:17 +00:00
|
|
|
|
2013-12-13 19:54:41 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcpy.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strcpy,
|
2020-05-13 23:00:26 +00:00
|
|
|
#ifdef __LITTLE_ENDIAN__
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strcpy, hwcap2 & PPC_FEATURE2_ARCH_3_00
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2020-05-13 23:00:26 +00:00
|
|
|
__strcpy_power9)
|
|
|
|
|
#endif
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strcpy, hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2014-12-23 11:59:44 +00:00
|
|
|
__strcpy_power8)
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strcpy, hwcap & PPC_FEATURE_ARCH_2_06
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2013-12-13 19:54:41 +00:00
|
|
|
__strcpy_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strcpy, 1,
|
|
|
|
|
__strcpy_ppc))
|
|
|
|
|
|
2013-12-13 19:55:22 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/stpcpy.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, stpcpy,
|
2020-05-13 23:08:35 +00:00
|
|
|
#ifdef __LITTLE_ENDIAN__
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, stpcpy, hwcap2 & PPC_FEATURE2_ARCH_3_00
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2020-05-13 23:08:35 +00:00
|
|
|
__stpcpy_power9)
|
|
|
|
|
#endif
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, stpcpy, hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2014-12-23 11:59:44 +00:00
|
|
|
__stpcpy_power8)
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, stpcpy, hwcap & PPC_FEATURE_ARCH_2_06
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2013-12-13 19:55:22 +00:00
|
|
|
__stpcpy_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, stpcpy, 1,
|
|
|
|
|
__stpcpy_ppc))
|
|
|
|
|
|
2013-12-13 19:38:17 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strlen.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strlen,
|
2020-05-18 16:16:06 +00:00
|
|
|
#ifdef __LITTLE_ENDIAN__
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strlen, hwcap2 & PPC_FEATURE2_ARCH_3_1
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
powerpc: Add optimized strlen for POWER10
Improvements compared to POWER9 version:
1. Take into account first 16B comparison for aligned strings
The previous version compares the first 16B and increments r4 by the number
of bytes until the address is 16B-aligned, then starts doing aligned loads at
that address. For aligned strings, this causes the first 16B to be compared
twice, because the increment is 0. Here we calculate the next 16B-aligned
address differently, which avoids that issue.
2. Use simple comparisons for the first ~192 bytes
The main loop is good for big strings, but comparing 16B each time is better
for smaller strings. So after aligning the address to 16 Bytes, we check
more 176B in 16B chunks. There may be some overlaps with the main loop for
unaligned strings, but we avoid using the more aggressive strategy too soon,
and also allow the loop to start at a 64B-aligned address. This greatly
benefits smaller strings and avoids overlapping checks if the string is
already aligned at a 64B boundary.
3. Reduce dependencies between load blocks caused by address calculation on loop
Doing a precise time tracing on the code showed many loads in the loop were
stalled waiting for updates to r4 from previous code blocks. This
implementation avoids that as much as possible by using 2 registers (r4 and
r5) to hold addresses to be used by different parts of the code.
Also, the previous code aligned the address to 16B, then to 64B by doing a
few 48B loops (if needed) until the address was aligned. The main loop could
not start until that 48B loop had finished and r4 was updated with the
current address. Here we calculate the address used by the loop very early,
so it can start sooner.
The main loop now uses 2 pointers 128B apart to make pointer updates less
frequent, and also unrolls 1 iteration to guarantee there is enough time
between iterations to update the pointers, reducing stalled cycles.
4. Use new P10 instructions
lxvp is used to load 32B with a single instruction, reducing contention in
the load queue.
vextractbm allows simplifying the tail code for the loop, replacing
vbpermq and avoiding having to generate a permute control vector.
Reviewed-by: Paul E Murphy <murphyp@linux.ibm.com>
Reviewed-by: Raphael M Zinsly <rzinsly@linux.ibm.com>
Reviewed-by: Lucas A. M. Magalhaes <lamm@linux.ibm.com>
2020-09-29 18:40:08 +00:00
|
|
|
__strlen_power10)
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strlen, hwcap2 & PPC_FEATURE2_ARCH_3_00
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2020-05-18 16:16:06 +00:00
|
|
|
__strlen_power9)
|
|
|
|
|
#endif
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strlen, hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2015-11-11 19:31:28 +00:00
|
|
|
__strlen_power8)
|
2021-07-27 05:47:49 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strlen, hwcap & PPC_FEATURE_ARCH_2_06,
|
2013-12-13 19:38:17 +00:00
|
|
|
__strlen_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strlen, 1,
|
|
|
|
|
__strlen_ppc))
|
2013-12-13 19:48:48 +00:00
|
|
|
|
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strncmp.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strncmp,
|
2018-08-16 06:42:02 +00:00
|
|
|
#ifdef __LITTLE_ENDIAN__
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strncmp, hwcap2 & PPC_FEATURE2_ARCH_3_00
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2016-12-13 05:23:42 +00:00
|
|
|
__strncmp_power9)
|
2018-08-16 06:42:02 +00:00
|
|
|
#endif
|
2015-01-09 21:04:26 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strncmp, hwcap2 & PPC_FEATURE2_ARCH_2_07,
|
|
|
|
|
__strncmp_power8)
|
2013-12-13 19:48:48 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strncmp, 1,
|
|
|
|
|
__strncmp_ppc))
|
2013-12-13 19:49:54 +00:00
|
|
|
|
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strchr.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strchr,
|
2016-12-27 19:48:37 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strchr,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2016-12-27 19:48:37 +00:00
|
|
|
__strchr_power8)
|
2013-12-13 19:49:54 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strchr,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2013-12-13 19:49:54 +00:00
|
|
|
__strchr_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strchr, 1,
|
|
|
|
|
__strchr_ppc))
|
2013-12-13 19:50:26 +00:00
|
|
|
|
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strchrnul.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strchrnul,
|
2016-12-27 19:48:37 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strchrnul,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2016-12-27 19:48:37 +00:00
|
|
|
__strchrnul_power8)
|
2013-12-13 19:50:26 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strchrnul,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2013-12-13 19:50:26 +00:00
|
|
|
__strchrnul_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strchrnul, 1,
|
|
|
|
|
__strchrnul_ppc))
|
2013-12-13 19:31:41 +00:00
|
|
|
#endif
|
|
|
|
|
|
2013-12-13 19:32:31 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/memcmp.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, memcmp,
|
2021-05-06 20:01:52 +00:00
|
|
|
#ifdef __LITTLE_ENDIAN__
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memcmp,
|
|
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_3_1
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
|
|
|
|
__memcmp_power10)
|
|
|
|
|
#endif
|
2021-07-27 05:47:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memcmp, hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2017-05-18 05:51:20 +00:00
|
|
|
__memcmp_power8)
|
2021-07-27 05:47:49 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memcmp, hwcap & PPC_FEATURE_ARCH_2_06,
|
2013-12-13 19:32:31 +00:00
|
|
|
__memcmp_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memcmp, hwcap & PPC_FEATURE_POWER4,
|
|
|
|
|
__memcmp_power4)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memcmp, 1, __memcmp_ppc))
|
|
|
|
|
|
2013-12-13 19:34:06 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/mempcpy.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, mempcpy,
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, mempcpy,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2013-12-13 19:34:06 +00:00
|
|
|
__mempcpy_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, mempcpy, 1,
|
|
|
|
|
__mempcpy_ppc))
|
|
|
|
|
|
2013-12-13 19:35:28 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/memchr.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, memchr,
|
2017-06-21 05:25:12 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memchr,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2017-06-21 05:25:12 +00:00
|
|
|
__memchr_power8)
|
2013-12-13 19:35:28 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memchr,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2013-12-13 19:35:28 +00:00
|
|
|
__memchr_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memchr, 1,
|
|
|
|
|
__memchr_ppc))
|
|
|
|
|
|
2013-12-13 19:36:50 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/memrchr.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, memrchr,
|
2017-10-02 12:01:13 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memrchr,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2017-10-02 12:01:13 +00:00
|
|
|
__memrchr_power8)
|
2013-12-13 19:36:50 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, memrchr,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2013-12-13 19:36:50 +00:00
|
|
|
__memrchr_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, memrchr, 1,
|
|
|
|
|
__memrchr_ppc))
|
|
|
|
|
|
2013-12-13 19:37:26 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/rawmemchr.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, rawmemchr,
|
2020-05-14 11:49:16 +00:00
|
|
|
#ifdef __LITTLE_ENDIAN__
|
powerpc: Add optimized rawmemchr for POWER10
Reuse code for optimized strlen to implement a faster version of rawmemchr.
This takes advantage of the same benefits provided by the strlen implementation,
but needs some extra steps. __strlen_power10 code should be unchanged after this
change.
rawmemchr returns a pointer to the char found, while strlen returns only the
length, so we have to take that into account when preparing the return value.
To quickly check 64B, the loop on __strlen_power10 merges the whole block into
16B by using unsigned minimum vector operations (vminub) and checks if there are
any \0 on the resulting vector. The same code is used by rawmemchr if the char c
is 0. However, this approach does not work when c != 0. We first need to
subtract each byte by c, so that the value we are looking for is converted to a
0, then taking the minimum and checking for nulls works again.
The new code branches after it has compared ~256 bytes and chooses which of the
two strategies above will be used in the main loop, based on the char c. This
extra branch adds some overhead (~5%) for length ~256, but is quickly amortized
by the faster loop for larger sizes.
Compared to __rawmemchr_power9, this version is ~20% faster for length < 256.
Because of the optimized main loop, the improvement becomes ~35% for c != 0
and ~50% for c = 0 for strings longer than 256.
Reviewed-by: Lucas A. M. Magalhaes <lamm@linux.ibm.com>
Reviewed-by: Raphael M Zinsly <rzinsly@linux.ibm.com>
2021-05-11 20:53:07 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, rawmemchr,
|
|
|
|
|
(hwcap2 & PPC_FEATURE2_ARCH_3_1)
|
|
|
|
|
&& (hwcap & PPC_FEATURE_HAS_VSX),
|
|
|
|
|
__rawmemchr_power10)
|
2020-05-14 11:49:16 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, rawmemchr,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_3_00
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2020-05-14 11:49:16 +00:00
|
|
|
__rawmemchr_power9)
|
|
|
|
|
#endif
|
2013-12-13 19:37:26 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, rawmemchr,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2013-12-13 19:37:26 +00:00
|
|
|
__rawmemchr_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, rawmemchr, 1,
|
|
|
|
|
__rawmemchr_ppc))
|
|
|
|
|
|
2013-12-13 19:38:50 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strnlen.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strnlen,
|
2017-04-05 13:24:24 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strnlen,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2017-04-05 13:24:24 +00:00
|
|
|
__strnlen_power8)
|
2021-07-27 05:47:49 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strnlen, hwcap & PPC_FEATURE_ARCH_2_06,
|
2013-12-13 19:38:50 +00:00
|
|
|
__strnlen_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strnlen, 1,
|
|
|
|
|
__strnlen_ppc))
|
|
|
|
|
|
2013-12-13 19:39:51 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcasecmp.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strcasecmp,
|
2016-06-14 09:21:16 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2016-06-14 09:21:16 +00:00
|
|
|
__strcasecmp_power8)
|
2013-12-13 19:39:51 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2013-12-13 19:39:51 +00:00
|
|
|
__strcasecmp_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp, 1, __strcasecmp_ppc))
|
|
|
|
|
|
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcasecmp_l.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strcasecmp_l,
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp_l,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2013-12-13 19:39:51 +00:00
|
|
|
__strcasecmp_l_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strcasecmp_l, 1,
|
|
|
|
|
__strcasecmp_l_ppc))
|
|
|
|
|
|
2013-12-13 19:40:28 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strncase.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strncasecmp,
|
2016-06-14 09:21:16 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2016-06-14 09:21:16 +00:00
|
|
|
__strncasecmp_power8)
|
2013-12-13 19:40:28 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2013-12-13 19:40:28 +00:00
|
|
|
__strncasecmp_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp, 1, __strncasecmp_ppc))
|
|
|
|
|
|
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strncase_l.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strncasecmp_l,
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp_l,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2013-12-13 19:40:28 +00:00
|
|
|
__strncasecmp_l_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strncasecmp_l, 1,
|
|
|
|
|
__strncasecmp_l_ppc))
|
|
|
|
|
|
2014-03-03 14:06:41 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strrchr.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strrchr,
|
2017-04-18 05:58:56 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strrchr,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2017-04-18 05:58:56 +00:00
|
|
|
__strrchr_power8)
|
2014-03-03 14:06:41 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strrchr,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2014-03-03 14:06:41 +00:00
|
|
|
__strrchr_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strrchr, 1,
|
|
|
|
|
__strrchr_ppc))
|
|
|
|
|
|
2014-03-07 12:09:47 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strncat.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strncat,
|
2017-04-13 05:59:20 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strncat,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2017-04-13 05:59:20 +00:00
|
|
|
__strncat_power8)
|
2014-03-07 12:09:47 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strncat,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2014-03-07 12:09:47 +00:00
|
|
|
__strncat_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strncat, 1,
|
|
|
|
|
__strncat_ppc))
|
|
|
|
|
|
2014-05-06 00:10:45 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strncpy.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strncpy,
|
2020-11-12 16:12:24 +00:00
|
|
|
#ifdef __LITTLE_ENDIAN__
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strncpy,
|
|
|
|
|
(hwcap2 & PPC_FEATURE2_ARCH_3_00)
|
|
|
|
|
&& (hwcap & PPC_FEATURE_HAS_VSX),
|
|
|
|
|
__strncpy_power9)
|
|
|
|
|
#endif
|
2014-12-31 16:47:41 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strncpy,
|
|
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07,
|
|
|
|
|
__strncpy_power8)
|
2014-05-06 00:10:45 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strncpy,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2014-05-06 00:10:45 +00:00
|
|
|
__strncpy_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strncpy, 1,
|
|
|
|
|
__strncpy_ppc))
|
|
|
|
|
|
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/stpncpy.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, stpncpy,
|
2020-11-12 16:12:24 +00:00
|
|
|
#ifdef __LITTLE_ENDIAN__
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, stpncpy,
|
|
|
|
|
(hwcap2 & PPC_FEATURE2_ARCH_3_00)
|
|
|
|
|
&& (hwcap & PPC_FEATURE_HAS_VSX),
|
|
|
|
|
__stpncpy_power9)
|
|
|
|
|
#endif
|
2014-12-31 16:47:41 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, stpncpy,
|
|
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07,
|
|
|
|
|
__stpncpy_power8)
|
2014-05-06 00:10:45 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, stpncpy,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2014-05-06 00:10:45 +00:00
|
|
|
__stpncpy_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, stpncpy, 1,
|
|
|
|
|
__stpncpy_ppc))
|
|
|
|
|
|
2014-06-06 12:56:07 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcmp.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strcmp,
|
2018-08-16 06:42:02 +00:00
|
|
|
#ifdef __LITTLE_ENDIAN__
|
2016-12-01 06:05:43 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strcmp,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_3_00
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2016-12-01 06:05:43 +00:00
|
|
|
__strcmp_power9)
|
2018-08-16 06:42:02 +00:00
|
|
|
#endif
|
2015-01-07 12:18:30 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strcmp,
|
|
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07,
|
|
|
|
|
__strcmp_power8)
|
2014-06-06 12:56:07 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strcmp,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2014-06-06 12:56:07 +00:00
|
|
|
__strcmp_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strcmp, 1,
|
|
|
|
|
__strcmp_ppc))
|
2014-06-12 03:21:20 +00:00
|
|
|
|
|
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcat.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strcat,
|
2014-12-23 18:36:34 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strcat,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2014-12-23 18:36:34 +00:00
|
|
|
__strcat_power8)
|
2014-06-12 03:21:20 +00:00
|
|
|
IFUNC_IMPL_ADD (array, i, strcat,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2014-06-12 03:21:20 +00:00
|
|
|
__strcat_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strcat, 1,
|
|
|
|
|
__strcat_ppc))
|
|
|
|
|
|
2016-03-14 21:40:46 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strspn.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strspn,
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strspn,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2016-03-14 21:40:46 +00:00
|
|
|
__strspn_power8)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strspn, 1,
|
|
|
|
|
__strspn_ppc))
|
|
|
|
|
|
2016-04-25 14:11:02 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcspn.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strcspn,
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strcspn,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_VSX,
|
2016-04-25 14:11:02 +00:00
|
|
|
__strcspn_power8)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strcspn, 1,
|
|
|
|
|
__strcspn_ppc))
|
|
|
|
|
|
2015-06-24 06:08:21 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strstr.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strstr,
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strstr,
|
2021-07-27 05:47:49 +00:00
|
|
|
hwcap & PPC_FEATURE_ARCH_2_06,
|
2015-06-24 06:08:21 +00:00
|
|
|
__strstr_power7)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strstr, 1,
|
|
|
|
|
__strstr_ppc))
|
|
|
|
|
|
|
|
|
|
|
2016-04-20 17:40:42 +00:00
|
|
|
/* Support sysdeps/powerpc/powerpc64/multiarch/strcasestr.c. */
|
|
|
|
|
IFUNC_IMPL (i, name, strcasestr,
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strcasestr,
|
2021-07-27 05:47:51 +00:00
|
|
|
hwcap2 & PPC_FEATURE2_ARCH_2_07
|
|
|
|
|
&& hwcap & PPC_FEATURE_HAS_ALTIVEC,
|
2016-04-20 17:40:42 +00:00
|
|
|
__strcasestr_power8)
|
|
|
|
|
IFUNC_IMPL_ADD (array, i, strcasestr, 1,
|
|
|
|
|
__strcasestr_ppc))
|
|
|
|
|
|
2022-06-10 16:13:29 +00:00
|
|
|
return 0;
|
2013-12-13 19:31:41 +00:00
|
|
|
}
|