about summary refs log tree commit diff
path: root/sysdeps/powerpc/powerpc64/multiarch/Makefile
diff options
context:
space:
mode:
author: Tulio Magno Quites Machado Filho <tuliom@linux.ibm.com> 2021-04-30 18:12:08 -0300
committer: Tulio Magno Quites Machado Filho <tuliom@linux.ibm.com> 2021-04-30 18:12:08 -0300
commit: e941e0ae80626b7661c1db8953a673cafd3b8b19 (patch)
tree: 42b3dcccfce69af0f7ffb0fa4ed2ed75734b82a2 /sysdeps/powerpc/powerpc64/multiarch/Makefile
parent: dd59655e9371af86043b97e38953f43bd9496699 (diff)
download: glibc-e941e0ae80626b7661c1db8953a673cafd3b8b19.tar.gz
glibc-e941e0ae80626b7661c1db8953a673cafd3b8b19.tar.xz
glibc-e941e0ae80626b7661c1db8953a673cafd3b8b19.zip
powerpc64le: Optimize memcpy for POWER10
This implementation is based on __memcpy_power8_cached and integrates
suggestions from Anton Blanchard.
It benefits from loads and stores with length for short lengths and for
tail code, simplifying the code.

All unaligned memory accesses use instructions that do not generate
alignment interrupts on POWER10, making it safe to use on
caching-inhibited memory.

The main loop has also been modified in order to increase instruction
throughput by reducing the dependency on updates from previous iterations.

On average, this implementation provides around 30% improvement when
compared to __memcpy_power7 and 10% improvement in comparison to
__memcpy_power8_cached.
Diffstat (limited to 'sysdeps/powerpc/powerpc64/multiarch/Makefile')
-rw-r--r-- sysdeps/powerpc/powerpc64/multiarch/Makefile 2
1 file changed, 1 insertion, 1 deletion
diff --git a/sysdeps/powerpc/powerpc64/multiarch/Makefile b/sysdeps/powerpc/powerpc64/multiarch/Makefile
index a82219c490..9ef12d3563 100644
--- a/sysdeps/powerpc/powerpc64/multiarch/Makefile
+++ b/sysdeps/powerpc/powerpc64/multiarch/Makefile
@@ -32,7 +32,7 @@ sysdep_routines += memcpy-power8-cached memcpy-power7 memcpy-a2 memcpy-power6 \
 		   strncase-power8
 
 ifneq (,$(filter %le,$(config-machine)))
-sysdep_routines += memmove-power10 \
+sysdep_routines += memcpy-power10 memmove-power10 \
 		   strcmp-power9 strncmp-power9 strcpy-power9 stpcpy-power9 \
 		   rawmemchr-power9 strlen-power9 strncpy-power9 stpncpy-power9 \
 		   strlen-power10