diff options
| author | Stanislav Mekhanoshin <Stanislav.Mekhanoshin@amd.com> | 2019-10-18 22:48:45 +0000 |
|---|---|---|
| committer | Stanislav Mekhanoshin <Stanislav.Mekhanoshin@amd.com> | 2019-10-18 22:48:45 +0000 |
| commit | 0fab220eb5882ef451d039d5251a0a1298121f63 (patch) | |
| tree | 9ff30b1e8195121d66cc5d048779a1660eaf79e8 /llvm/lib/Target | |
| parent | 0b7f320c3acb4ed75e5b3acf3460176b5b20b1aa (diff) | |
| download | bcm5719-llvm-0fab220eb5882ef451d039d5251a0a1298121f63.tar.gz bcm5719-llvm-0fab220eb5882ef451d039d5251a0a1298121f63.zip | |
[AMDGPU] move PHI nodes to AGPR class
If all uses of a PHI are in AGPR register class we should
avoid unneeded copies via VGPRs.
Differential Revision: https://reviews.llvm.org/D69200
llvm-svn: 375297
Diffstat (limited to 'llvm/lib/Target')
| -rw-r--r-- | llvm/lib/Target/AMDGPU/SIFixSGPRCopies.cpp | 21 |
1 files changed, 16 insertions, 5 deletions
diff --git a/llvm/lib/Target/AMDGPU/SIFixSGPRCopies.cpp b/llvm/lib/Target/AMDGPU/SIFixSGPRCopies.cpp index b3a76aa4046..65286751c12 100644 --- a/llvm/lib/Target/AMDGPU/SIFixSGPRCopies.cpp +++ b/llvm/lib/Target/AMDGPU/SIFixSGPRCopies.cpp @@ -757,6 +757,7 @@ bool SIFixSGPRCopies::runOnMachineFunction(MachineFunction &MF) { void SIFixSGPRCopies::processPHINode(MachineInstr &MI) { unsigned numVGPRUses = 0; + bool AllAGPRUses = true; SetVector<const MachineInstr *> worklist; SmallSet<const MachineInstr *, 4> Visited; worklist.insert(&MI); @@ -766,6 +767,9 @@ void SIFixSGPRCopies::processPHINode(MachineInstr &MI) { unsigned Reg = Instr->getOperand(0).getReg(); for (const auto &Use : MRI->use_operands(Reg)) { const MachineInstr *UseMI = Use.getParent(); + AllAGPRUses &= (UseMI->isCopy() && + TRI->isAGPR(*MRI, UseMI->getOperand(0).getReg())) || + TRI->isAGPR(*MRI, Use.getReg()); if (UseMI->isCopy() || UseMI->isRegSequence()) { if (UseMI->isCopy() && UseMI->getOperand(0).getReg().isPhysical() && @@ -794,11 +798,19 @@ void SIFixSGPRCopies::processPHINode(MachineInstr &MI) { } } } + + Register PHIRes = MI.getOperand(0).getReg(); + const TargetRegisterClass *RC0 = MRI->getRegClass(PHIRes); + if (AllAGPRUses && numVGPRUses && !TRI->hasAGPRs(RC0)) { + LLVM_DEBUG(dbgs() << "Moving PHI to AGPR: " << MI); + MRI->setRegClass(PHIRes, TRI->getEquivalentAGPRClass(RC0)); + } + bool hasVGPRInput = false; for (unsigned i = 1; i < MI.getNumOperands(); i += 2) { unsigned InputReg = MI.getOperand(i).getReg(); MachineInstr *Def = MRI->getVRegDef(InputReg); - if (TRI->isVGPR(*MRI, InputReg)) { + if (TRI->isVectorRegister(*MRI, InputReg)) { if (Def->isCopy()) { unsigned SrcReg = Def->getOperand(1).getReg(); const TargetRegisterClass *RC = @@ -810,15 +822,14 @@ void SIFixSGPRCopies::processPHINode(MachineInstr &MI) { break; } else if (Def->isCopy() && - TRI->isVGPR(*MRI, Def->getOperand(1).getReg())) { + TRI->isVectorRegister(*MRI, Def->getOperand(1).getReg())) { hasVGPRInput = true; break; } } - unsigned PHIRes = MI.getOperand(0).getReg(); - const TargetRegisterClass *RC0 = MRI->getRegClass(PHIRes); - if ((!TRI->isVGPR(*MRI, PHIRes) && RC0 != &AMDGPU::VReg_1RegClass) && + if ((!TRI->isVectorRegister(*MRI, PHIRes) && + RC0 != &AMDGPU::VReg_1RegClass) && (hasVGPRInput || numVGPRUses > 1)) { LLVM_DEBUG(dbgs() << "Fixing PHI: " << MI); TII->moveToVALU(MI); |

