aboutsummaryrefslogtreecommitdiffstats
path: root/test/CodeGen/X86/break-avx-dep.ll
diff options
context:
space:
mode:
author: Andrew Trick <atrick@apple.com> 2013-10-15 03:39:43 +0000
committer: Andrew Trick <atrick@apple.com> 2013-10-15 03:39:43 +0000
commit: 51dee24ca6ba63cf021d56ca9cbae62c739d5041 (patch)
tree: 5ee39c0ca82e1099827441eada176b62d50a8e35 /test/CodeGen/X86/break-avx-dep.ll
parent: cc3d76d98259ef82c9592022cb0e31fb42b36ab6 (diff)
download: external_llvm-51dee24ca6ba63cf021d56ca9cbae62c739d5041.zip
external_llvm-51dee24ca6ba63cf021d56ca9cbae62c739d5041.tar.gz
external_llvm-51dee24ca6ba63cf021d56ca9cbae62c739d5041.tar.bz2
Improve on r192635, ExeDepsFix for avx, and add a test case.
rdar:15221834 False AVX register dependencies cause 5x slowdown on flops-5/6 and significant slowdown on several others. This was blocking the switch to MI-Sched.

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@192669 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'test/CodeGen/X86/break-avx-dep.ll')
-rw-r--r-- test/CodeGen/X86/break-avx-dep.ll 29
1 files changed, 29 insertions, 0 deletions
diff --git a/test/CodeGen/X86/break-avx-dep.ll b/test/CodeGen/X86/break-avx-dep.ll
new file mode 100644
index 0000000..eea7d15
--- /dev/null
+++ b/test/CodeGen/X86/break-avx-dep.ll
@@ -0,0 +1,29 @@
+; RUN: llc < %s -march=x86-64 -mattr=+avx | FileCheck %s
+;
+; rdar:15221834 False AVX register dependencies cause 5x slowdown on
+; flops-6. Make sure the unused register read by vcvtsi2sdq is zeroed
+; to avoid cyclic dependence on a write to the same register in a
+; previous iteration.
+
+; CHECK-LABEL: t1:
+; CHECK-LABEL: %loop
+; CHECK: vxorps %[[REG:xmm.]], %{{xmm.}}, %{{xmm.}}
+; CHECK: vcvtsi2sdq %{{r..}}, %[[REG]], %{{xmm.}}
+define i64 @t1(i64* nocapture %x, double* nocapture %y) nounwind { ; returns *x + sum over i = 1 .. 156249999 of fptosi(double(i) + *y)
+entry: ; runs once before the loop
+ %vx = load i64* %x ; initial value of the running sum
+ br label %loop
+loop: ; single-block loop; branches back to itself until the exit test passes
+ %i = phi i64 [ 1, %entry ], [ %inc, %loop ] ; induction variable, starts at 1
+ %s1 = phi i64 [ %vx, %entry ], [ %s2, %loop ] ; running sum carried in from the previous iteration
+ %fi = sitofp i64 %i to double ; i64 -> double conversion; the test header expects this to become vcvtsi2sdq
+ %vy = load double* %y ; *y is re-read on every iteration
+ %fipy = fadd double %fi, %vy ; double(i) + *y
+ %iipy = fptosi double %fipy to i64 ; convert that value back to i64
+ %s2 = add i64 %s1, %iipy ; accumulate into the running sum
+ %inc = add nsw i64 %i, 1 ; next value of i
+ %exitcond = icmp eq i64 %inc, 156250000 ; true once the next i would be 156250000
+ br i1 %exitcond, label %ret, label %loop ; exit when done, otherwise iterate again
+ret: ; loop exit
+ ret i64 %s2 ; final accumulated sum
+}