summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorPuyan Lotfi <puyan@puyan.org>2018-04-05 00:08:15 +0000
committerPuyan Lotfi <puyan@puyan.org>2018-04-05 00:08:15 +0000
commit26c504fe1e066b9a263b8f7d124d0f0d3a30a715 (patch)
treecc5365492e5088e4096d9b41a7f128245f2b9572
parent7bd45502fea71ea1e944e8534582c5143f11b52e (diff)
downloadbcm5719-llvm-26c504fe1e066b9a263b8f7d124d0f0d3a30a715.tar.gz
bcm5719-llvm-26c504fe1e066b9a263b8f7d124d0f0d3a30a715.zip
[MIR-Canon] Adding support for multi-def -> user distance reduction.
llvm-svn: 329243
-rw-r--r--llvm/lib/CodeGen/MIRCanonicalizerPass.cpp17
-rw-r--r--llvm/test/CodeGen/MIR/AMDGPU/mir-canon-multi.mir32
2 files changed, 49 insertions, 0 deletions
diff --git a/llvm/lib/CodeGen/MIRCanonicalizerPass.cpp b/llvm/lib/CodeGen/MIRCanonicalizerPass.cpp
index bd939fdf104..9ef097c97e7 100644
--- a/llvm/lib/CodeGen/MIRCanonicalizerPass.cpp
+++ b/llvm/lib/CodeGen/MIRCanonicalizerPass.cpp
@@ -189,6 +189,7 @@ static bool rescheduleCanonically(unsigned &PseudoIdempotentInstCount,
Instructions.push_back(&MI);
}
+ std::map<MachineInstr *, std::vector<MachineInstr *>> MultiUsers;
std::vector<MachineInstr *> PseudoIdempotentInstructions;
std::vector<unsigned> PhysRegDefs;
for (auto *II : Instructions) {
@@ -297,10 +298,26 @@ static bool rescheduleCanonically(unsigned &PseudoIdempotentInstCount,
UseI->dump();
});
+ MultiUsers[UseToBringDefCloserTo].push_back(Def);
Changed = true;
MBB->splice(UseI, MBB, DefI);
}
+ // Sort the defs for users of multiple defs lexographically.
+ for (const auto &E : MultiUsers) {
+
+ auto UseI =
+ std::find_if(MBB->instr_begin(), MBB->instr_end(),
+ [&](MachineInstr &MI) -> bool { return &MI == E.first; });
+
+ if (UseI == MBB->instr_end())
+ continue;
+
+ DEBUG(dbgs() << "Rescheduling Multi-Use Instructions Lexographically.";);
+ Changed |= rescheduleLexographically(
+ E.second, MBB, [&]() -> MachineBasicBlock::iterator { return UseI; });
+ }
+
PseudoIdempotentInstCount = PseudoIdempotentInstructions.size();
DEBUG(dbgs() << "Rescheduling Idempotent Instructions Lexographically.";);
Changed |= rescheduleLexographically(
diff --git a/llvm/test/CodeGen/MIR/AMDGPU/mir-canon-multi.mir b/llvm/test/CodeGen/MIR/AMDGPU/mir-canon-multi.mir
new file mode 100644
index 00000000000..fd8d58527f7
--- /dev/null
+++ b/llvm/test/CodeGen/MIR/AMDGPU/mir-canon-multi.mir
@@ -0,0 +1,32 @@
+# RUN: llc -o - -march=amdgcn -run-pass mir-canonicalizer -x mir %s | FileCheck %s
+
+# CHECK: %1363:vgpr_32 = COPY %4354
+# CHECK: %1368:vgpr_32 = COPY %4355
+# CHECK: %1369:vgpr_32 = COPY %1372
+# CHECK: %1370:vgpr_32 = COPY %1373
+# CHECK: REG_SEQUENCE %1368, %subreg.sub0, %1363, %subreg.sub1
+# CHECK: REG_SEQUENCE %1368, %subreg.sub0, %1363, %subreg.sub1, %1369, %subreg.sub2, %1370, %subreg.sub3
+
+...
+---
+name: foo
+body: |
+ bb.0:
+ %10:sreg_32_xm0 = S_MOV_B32 61440
+ %11:sreg_32_xm0 = S_MOV_B32 0
+ %3:vgpr_32 = COPY $vgpr0
+
+ %vreg123_0:vgpr_32 = COPY %3
+ %0:sgpr_64 = COPY $sgpr0_sgpr1
+ %vreg123_1:vgpr_32 = COPY %11
+ %27:vreg_64 = REG_SEQUENCE %vreg123_0, %subreg.sub0, %vreg123_1, %subreg.sub1
+ %4:sreg_64_xexec = S_LOAD_DWORDX2_IMM %0, 9, 0
+ %vreg123_2:vgpr_32 = COPY %4
+ %5:sreg_64_xexec = S_LOAD_DWORDX2_IMM %0, 11, 0
+ %vreg123_3:vgpr_32 = COPY %5
+ %16:sgpr_128 = REG_SEQUENCE killed %vreg123_0, %subreg.sub0, %vreg123_1, %subreg.sub1, %vreg123_2, %subreg.sub2, %vreg123_3, %subreg.sub3
+
+ BUFFER_STORE_DWORD_ADDR64 %vreg123_1, %27, killed %16, 0, 0, 0, 0, 0, implicit $exec
+ S_ENDPGM
+
+...
OpenPOWER on IntegriCloud