summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--llvm/lib/CodeGen/IfConversion.cpp10
-rw-r--r--llvm/lib/CodeGen/LivePhysRegs.cpp11
-rw-r--r--llvm/test/CodeGen/ARM/ifcvt-dead-def.ll55
3 files changed, 71 insertions, 5 deletions
diff --git a/llvm/lib/CodeGen/IfConversion.cpp b/llvm/lib/CodeGen/IfConversion.cpp
index 3ac78b25854..5df18fbe199 100644
--- a/llvm/lib/CodeGen/IfConversion.cpp
+++ b/llvm/lib/CodeGen/IfConversion.cpp
@@ -980,10 +980,10 @@ static void UpdatePredRedefs(MachineInstr *MI, LivePhysRegs &Redefs) {
// Now add the implicit uses for each of the clobbered values.
for (auto Reg : Clobbers) {
- const MachineOperand &Op = *Reg.second;
// FIXME: Const cast here is nasty, but better than making StepForward
// take a mutable instruction instead of const.
- MachineInstr *OpMI = const_cast<MachineInstr*>(Op.getParent());
+ MachineOperand &Op = const_cast<MachineOperand&>(*Reg.second);
+ MachineInstr *OpMI = Op.getParent();
MachineInstrBuilder MIB(*OpMI->getParent()->getParent(), OpMI);
if (Op.isRegMask()) {
// First handle regmasks. They clobber any entries in the mask which
@@ -999,6 +999,12 @@ static void UpdatePredRedefs(MachineInstr *MI, LivePhysRegs &Redefs) {
continue;
}
assert(Op.isReg() && "Register operand required");
+ if (Op.isDead()) {
+ // If we found a dead def, but it needs to be live, then remove the dead
+ // flag.
+ if (Redefs.contains(Op.getReg()))
+ Op.setIsDead(false);
+ }
MIB.addReg(Reg.first, RegState::Implicit | RegState::Undef);
}
}
diff --git a/llvm/lib/CodeGen/LivePhysRegs.cpp b/llvm/lib/CodeGen/LivePhysRegs.cpp
index b6369275051..eef7643367f 100644
--- a/llvm/lib/CodeGen/LivePhysRegs.cpp
+++ b/llvm/lib/CodeGen/LivePhysRegs.cpp
@@ -77,8 +77,9 @@ void LivePhysRegs::stepForward(const MachineInstr &MI,
if (Reg == 0)
continue;
if (O->isDef()) {
- if (!O->isDead())
- Clobbers.push_back(std::make_pair(Reg, &*O));
+ // Note, dead defs are still recorded. The caller should decide how to
+ // handle them.
+ Clobbers.push_back(std::make_pair(Reg, &*O));
} else {
if (!O->isKill())
continue;
@@ -90,8 +91,12 @@ void LivePhysRegs::stepForward(const MachineInstr &MI,
}
// Add defs to the set.
- for (auto Reg : Clobbers)
+ for (auto Reg : Clobbers) {
+ // Skip dead defs. They shouldn't be added to the set.
+ if (Reg.second->isReg() && Reg.second->isDead())
+ continue;
addReg(Reg.first);
+ }
}
/// Prin the currently live registers to OS.
diff --git a/llvm/test/CodeGen/ARM/ifcvt-dead-def.ll b/llvm/test/CodeGen/ARM/ifcvt-dead-def.ll
new file mode 100644
index 00000000000..77a3f5c0961
--- /dev/null
+++ b/llvm/test/CodeGen/ARM/ifcvt-dead-def.ll
@@ -0,0 +1,55 @@
+; RUN: llc %s -o - -verify-machineinstrs | FileCheck %s
+
+target datalayout = "e-m:o-p:32:32-f64:32:64-v64:32:64-v128:32:128-a:0:32-n32-S32"
+target triple = "thumbv7-unknown-unknown"
+
+%struct.ref_s = type { %union.v, i16, i16 }
+%union.v = type { i32 }
+%struct.gs_color_s = type { i16, i16, i16, i16, i8, i8 }
+
+; In this case, the if converter was cloning the return instruction so that we had
+; r2<def> = ...
+; return [pred] r2<dead,def>
+; ldr <r2, kill>
+; return
+; The problem here was that the dead def on the first return was making the machine verifier
+; think that the load read from an undefined register. We need to remove the dead flag from
+; the return, and also add an implicit use of the prior value of r2.
+
+; CHECK: ldrh
+
+; Function Attrs: minsize nounwind optsize ssp
+define i32 @test(%struct.ref_s* %pref1, %struct.ref_s* %pref2, %struct.gs_color_s** %tmp152) #0 {
+bb:
+ %nref = alloca %struct.ref_s, align 4
+ %tmp46 = call %struct.ref_s* @name_string_ref(%struct.ref_s* %pref1, %struct.ref_s* %nref) #2
+ %tmp153 = load %struct.gs_color_s*, %struct.gs_color_s** %tmp152, align 4
+ %tmp154 = bitcast %struct.ref_s* %pref2 to %struct.gs_color_s**
+ %tmp155 = load %struct.gs_color_s*, %struct.gs_color_s** %tmp154, align 4
+ %tmp162 = getelementptr inbounds %struct.gs_color_s, %struct.gs_color_s* %tmp153, i32 0, i32 1
+ %tmp163 = load i16, i16* %tmp162, align 2
+ %tmp164 = getelementptr inbounds %struct.gs_color_s, %struct.gs_color_s* %tmp155, i32 0, i32 1
+ %tmp165 = load i16, i16* %tmp164, align 2
+ %tmp166 = icmp eq i16 %tmp163, %tmp165
+ br i1 %tmp166, label %bb167, label %bb173
+
+bb167: ; preds = %bb
+ %tmp168 = getelementptr inbounds %struct.gs_color_s, %struct.gs_color_s* %tmp153, i32 0, i32 2
+ %tmp169 = load i16, i16* %tmp168, align 2
+ %tmp170 = getelementptr inbounds %struct.gs_color_s, %struct.gs_color_s* %tmp155, i32 0, i32 2
+ %tmp171 = load i16, i16* %tmp170, align 2
+ %tmp172 = icmp eq i16 %tmp169, %tmp171
+ br label %bb173
+
+bb173: ; preds = %bb167, %bb
+ %tmp174 = phi i1 [ false, %bb ], [ %tmp172, %bb167 ]
+ %tmp175 = zext i1 %tmp174 to i32
+ ret i32 %tmp175
+}
+
+; Function Attrs: minsize optsize
+declare %struct.ref_s* @name_string_ref(%struct.ref_s*, %struct.ref_s*) #1
+
+attributes #0 = { minsize nounwind optsize }
+attributes #1 = { minsize optsize }
+attributes #2 = { minsize nounwind optsize }
OpenPOWER on IntegriCloud