aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorAndrew Trick <atrick@apple.com>2011-09-15 01:09:33 +0000
committerAndrew Trick <atrick@apple.com>2011-09-15 01:09:33 +0000
commitb1afbac64b7c4c06959350acc175fb3552012f57 (patch)
tree20d54cdd0eba1c8071a9625fb4236f1eccdfa834
parent322ea080ada5608de41f82127f053f754e459910 (diff)
downloadexternal_llvm-b1afbac64b7c4c06959350acc175fb3552012f57.zip
external_llvm-b1afbac64b7c4c06959350acc175fb3552012f57.tar.gz
external_llvm-b1afbac64b7c4c06959350acc175fb3552012f57.tar.bz2
[regcoalescing] bug fix for RegistersDefinedFromSameValue.
An improper SlotIndex->VNInfo lookup was leading to unsafe copy removal. Fixes PR10920 401.bzip2 miscompile with no IV rewrite. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@139765 91177308-0d34-0410-b5e6-96231b3b80d8
-rw-r--r--include/llvm/CodeGen/LiveInterval.h8
-rw-r--r--lib/CodeGen/RegisterCoalescer.cpp7
-rw-r--r--test/CodeGen/X86/2011-09-14-valcoalesce.ll115
3 files changed, 128 insertions, 2 deletions
diff --git a/include/llvm/CodeGen/LiveInterval.h b/include/llvm/CodeGen/LiveInterval.h
index 4041172..0daaf82 100644
--- a/include/llvm/CodeGen/LiveInterval.h
+++ b/include/llvm/CodeGen/LiveInterval.h
@@ -411,6 +411,14 @@ namespace llvm {
return I == end() ? 0 : I->valno;
}
+ /// getVNInfoBefore - Return the VNInfo that is live up to but not
+ /// necessarilly including Idx, or NULL. Use this to find the reaching def
+ /// used by an instruction at this SlotIndex position.
+ VNInfo *getVNInfoBefore(SlotIndex Idx) const {
+ const_iterator I = FindLiveRangeContaining(Idx.getPrevIndex());
+ return I == end() ? 0 : I->valno;
+ }
+
/// FindLiveRangeContaining - Return an iterator to the live range that
/// contains the specified index, or end() if there is none.
iterator FindLiveRangeContaining(SlotIndex Idx) {
diff --git a/lib/CodeGen/RegisterCoalescer.cpp b/lib/CodeGen/RegisterCoalescer.cpp
index 62d6306..f3b8ae3 100644
--- a/lib/CodeGen/RegisterCoalescer.cpp
+++ b/lib/CodeGen/RegisterCoalescer.cpp
@@ -692,7 +692,7 @@ bool RegisterCoalescer::RemoveCopyByCommutingDef(const CoalescerPair &CP,
// If some of the uses of IntA.reg is already coalesced away, return false.
// It's not possible to determine whether it's safe to perform the coalescing.
- for (MachineRegisterInfo::use_nodbg_iterator UI =
+ for (MachineRegisterInfo::use_nodbg_iterator UI =
MRI->use_nodbg_begin(IntA.reg),
UE = MRI->use_nodbg_end(); UI != UE; ++UI) {
MachineInstr *UseMI = &*UI;
@@ -1370,6 +1370,7 @@ static unsigned ComputeUltimateVN(VNInfo *VNI,
// which allows us to coalesce A and B.
// VNI is the definition of B. LR is the life range of A that includes
// the slot just before B. If we return true, we add "B = X" to DupCopies.
+// This implies that A dominates B.
static bool RegistersDefinedFromSameValue(LiveIntervals &li,
const TargetRegisterInfo &tri,
CoalescerPair &CP,
@@ -1421,7 +1422,9 @@ static bool RegistersDefinedFromSameValue(LiveIntervals &li,
// If the copies use two different value numbers of X, we cannot merge
// A and B.
LiveInterval &SrcInt = li.getInterval(Src);
- if (SrcInt.getVNInfoAt(Other->def) != SrcInt.getVNInfoAt(VNI->def))
+ // getVNInfoBefore returns NULL for undef copies. In this case, the
+ // optimization is still safe.
+ if (SrcInt.getVNInfoBefore(Other->def) != SrcInt.getVNInfoBefore(VNI->def))
return false;
DupCopies.push_back(MI);
diff --git a/test/CodeGen/X86/2011-09-14-valcoalesce.ll b/test/CodeGen/X86/2011-09-14-valcoalesce.ll
new file mode 100644
index 0000000..4c3f789
--- /dev/null
+++ b/test/CodeGen/X86/2011-09-14-valcoalesce.ll
@@ -0,0 +1,115 @@
+; RUN: llc < %s -march=x86
+;
+; Test RegistersDefinedFromSameValue. We have multiple copies of the same vreg:
+; while.body85.i:
+; vreg1 = copy vreg2
+; vreg2 = add
+; critical edge from land.lhs.true.i -> if.end117.i:
+; vreg27 = vreg2
+; critical edge from land.lhs.true103.i -> if.end117.i:
+; vreg27 = vreg2
+; if.then108.i:
+; vreg27 = vreg1
+;
+; Prior to fixing PR10920 401.bzip miscompile, the coalescer would
+; consider vreg1 and vreg27 to be copies of the same value. It would
+; then remove one of the critical edge copes, which cannot safely be removed.
+
+target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:32:64-v64:64:64-v128:128:128-a0:0:64-f80:128:128-n8:16:32"
+
+@.str3 = external unnamed_addr constant [59 x i8], align 1
+
+define void @test() nounwind ssp {
+entry:
+ br i1 undef, label %if.then68, label %if.end85
+
+if.then68: ; preds = %entry
+ br label %for.body.i.i
+
+for.body.i.i: ; preds = %for.inc.i.i, %if.then68
+ br i1 undef, label %for.inc.i.i, label %if.then.i.i
+
+if.then.i.i: ; preds = %for.body.i.i
+ br label %for.inc.i.i
+
+for.inc.i.i: ; preds = %if.then.i.i, %for.body.i.i
+ br i1 undef, label %makeMaps_e.exit.i, label %for.body.i.i
+
+makeMaps_e.exit.i: ; preds = %for.inc.i.i
+ br i1 undef, label %for.cond19.preheader.i, label %for.cond.for.cond19.preheader_crit_edge.i
+
+for.cond.for.cond19.preheader_crit_edge.i: ; preds = %makeMaps_e.exit.i
+ unreachable
+
+for.cond19.preheader.i: ; preds = %makeMaps_e.exit.i
+ br i1 undef, label %if.then.i, label %if.end.i
+
+if.then.i: ; preds = %for.cond19.preheader.i
+ br label %if.end.i
+
+if.end.i: ; preds = %if.then.i, %for.cond19.preheader.i
+ br i1 undef, label %for.inc27.us.5.i, label %for.end30.i
+
+for.end30.i: ; preds = %if.end.i
+ br i1 undef, label %if.end36.i, label %if.then35.i
+
+if.then35.i: ; preds = %for.end30.i
+ unreachable
+
+if.end36.i: ; preds = %for.end30.i
+ br label %while.body.i188
+
+for.cond182.preheader.i: ; preds = %for.cond138.preheader.i
+ unreachable
+
+while.body.i188: ; preds = %for.cond138.preheader.i, %if.end36.i
+ %sub.i187 = add nsw i32 0, -1
+ br i1 undef, label %while.body85.i, label %if.end117.i
+
+while.body85.i: ; preds = %while.body85.i, %while.body.i188
+ %ge.0519.i = phi i32 [ %inc87.i, %while.body85.i ], [ %sub.i187, %while.body.i188 ]
+ %aFreq.0518.i = phi i32 [ %add93.i, %while.body85.i ], [ 0, %while.body.i188 ]
+ %inc87.i = add nsw i32 %ge.0519.i, 1
+ %tmp91.i = load i32* undef, align 4, !tbaa !0
+ %add93.i = add nsw i32 %tmp91.i, %aFreq.0518.i
+ %cmp84.i = icmp slt i32 %inc87.i, undef
+ %or.cond514.i = and i1 undef, %cmp84.i
+ br i1 %or.cond514.i, label %while.body85.i, label %while.end.i
+
+while.end.i: ; preds = %while.body85.i
+ br i1 undef, label %land.lhs.true.i, label %if.end117.i
+
+land.lhs.true.i: ; preds = %while.end.i
+ br i1 undef, label %if.end117.i, label %land.lhs.true103.i
+
+land.lhs.true103.i: ; preds = %land.lhs.true.i
+ br i1 undef, label %if.then108.i, label %if.end117.i
+
+if.then108.i: ; preds = %land.lhs.true103.i
+ br label %if.end117.i
+
+if.end117.i: ; preds = %if.then108.i, %land.lhs.true103.i, %land.lhs.true.i, %while.end.i, %while.body.i188
+ %aFreq.1.i = phi i32 [ %aFreq.0518.i, %if.then108.i ], [ %add93.i, %land.lhs.true103.i ], [ %add93.i, %while.end.i ], [ 0, %while.body.i188 ], [ %add93.i, %land.lhs.true.i ]
+ %cmp121.i = icmp sgt i32 undef, 2
+ br i1 %cmp121.i, label %if.then122.i, label %for.cond138.preheader.i
+
+if.then122.i: ; preds = %if.end117.i
+ call void (...)* @fprintf(i32 undef, i32 0, i32 undef, i32 %aFreq.1.i, double undef) nounwind
+ unreachable
+
+for.cond138.preheader.i: ; preds = %if.end117.i
+ %cmp73.i = icmp sgt i32 undef, 0
+ br i1 %cmp73.i, label %while.body.i188, label %for.cond182.preheader.i
+
+for.inc27.us.5.i: ; preds = %if.end.i
+ unreachable
+
+if.end85: ; preds = %entry
+ ret void
+}
+
+declare void @fprintf(...) nounwind
+
+!0 = metadata !{metadata !"int", metadata !1}
+!1 = metadata !{metadata !"omnipotent char", metadata !2}
+!2 = metadata !{metadata !"Simple C/C++ TBAA", null}