about summary refs log tree commit diff
diff options
context:
space:
mode:
author H.J. Lu <hjl.tools@gmail.com> 2016-01-15 12:15:53 -0800
committer H.J. Lu <hjl.tools@gmail.com> 2016-01-15 12:15:53 -0800
commit 890a46047fc84a97aec0321c4e52de33ec0f00c1 (patch)
tree 7fff02fc26bff456ea590ec9074ecc966687d145
parent e70cffd77b34d2a02d634d33d11802b50899b78b (diff)
download glibc-890a46047fc84a97aec0321c4e52de33ec0f00c1.tar.gz
glibc-890a46047fc84a97aec0321c4e52de33ec0f00c1.tar.xz
glibc-890a46047fc84a97aec0321c4e52de33ec0f00c1.zip
Group prefetcht1
-rw-r--r-- sysdeps/x86_64/multiarch/memcpy-avx512-no-vzeroupper.S 16
1 files changed, 8 insertions, 8 deletions
diff --git a/sysdeps/x86_64/multiarch/memcpy-avx512-no-vzeroupper.S b/sysdeps/x86_64/multiarch/memcpy-avx512-no-vzeroupper.S
index b12c80e8ad..2c96046f52 100644
--- a/sysdeps/x86_64/multiarch/memcpy-avx512-no-vzeroupper.S
+++ b/sysdeps/x86_64/multiarch/memcpy-avx512-no-vzeroupper.S
@@ -345,14 +345,14 @@ L(preloop_large):
 	prefetcht1 0x80(%rsi)
 	prefetcht1 0xC0(%rsi)
 L(gobble_256bytes_nt_loop):
-	vmovdqu64	(%rsi), %zmm0
 	prefetcht1 0x100(%rsi)
-	vmovdqu64	0x40(%rsi), %zmm1
 	prefetcht1 0x140(%rsi)
-	vmovdqu64	0x80(%rsi), %zmm2
 	prefetcht1 0x180(%rsi)
-	vmovdqu64	0xC0(%rsi), %zmm3
 	prefetcht1 0x1C0(%rsi)
+	vmovdqu64	(%rsi), %zmm0
+	vmovdqu64	0x40(%rsi), %zmm1
+	vmovdqu64	0x80(%rsi), %zmm2
+	vmovdqu64	0xC0(%rsi), %zmm3
 	vmovntdq %zmm0, (%rdi)
 	vmovntdq %zmm1, 0x40(%rdi)
 	vmovntdq %zmm2, 0x80(%rdi)
@@ -383,14 +383,14 @@ L(preloop_large_bkw):
 	prefetcht1 -0x80(%rcx)
 	prefetcht1 -0x40(%rcx)
 L(gobble_256bytes_nt_loop_bkw):
-	vmovdqu64	-0x100(%rcx), %zmm0
 	prefetcht1 -0x200(%rcx)
-	vmovdqu64	-0xC0(%rcx), %zmm1
 	prefetcht1 -0x1C0(%rcx)
-	vmovdqu64	-0x80(%rcx), %zmm2
 	prefetcht1 -0x180(%rcx)
-	vmovdqu64	-0x40(%rcx), %zmm3
 	prefetcht1 -0x140(%rcx)
+	vmovdqu64	-0x100(%rcx), %zmm0
+	vmovdqu64	-0xC0(%rcx), %zmm1
+	vmovdqu64	-0x80(%rcx), %zmm2
+	vmovdqu64	-0x40(%rcx), %zmm3
 	vmovntdq %zmm0,	-0x100(%r9)
 	vmovntdq %zmm1,	-0xC0(%r9)
 	vmovntdq %zmm2,	-0x80(%r9)