summaryrefslogtreecommitdiffstats
path: root/llvm/lib/Target/R600/SIInsertWaits.cpp
diff options
context:
space:
mode:
author: Tom Stellard <thomas.stellard@amd.com>, 2015-01-06 19:52:07 +0000
committer: Tom Stellard <thomas.stellard@amd.com>, 2015-01-06 19:52:07 +0000
commit: 9d6797ae5804e4bf9a0a760d136d4b6a28b47b83 (patch)
tree: faf88ff2b7d22e68157bc65910ef800d64e69c74 /llvm/lib/Target/R600/SIInsertWaits.cpp
parent: b3931b814adc8a6c3d6b8b1d6a2a0faa6d4cdc52 (diff)
download: bcm5719-llvm-9d6797ae5804e4bf9a0a760d136d4b6a28b47b83.tar.gz
download: bcm5719-llvm-9d6797ae5804e4bf9a0a760d136d4b6a28b47b83.zip
R600/SI: Insert s_waitcnt before s_barrier instructions.
This ensures that all memory operations are complete when all threads reach the barrier.

llvm-svn: 225290
Diffstat (limited to 'llvm/lib/Target/R600/SIInsertWaits.cpp')
-rw-r--r-- llvm/lib/Target/R600/SIInsertWaits.cpp | 6
1 file changed, 5 insertions, 1 deletion
diff --git a/llvm/lib/Target/R600/SIInsertWaits.cpp b/llvm/lib/Target/R600/SIInsertWaits.cpp
index 2e56508e2fa..181b11643bf 100644
--- a/llvm/lib/Target/R600/SIInsertWaits.cpp
+++ b/llvm/lib/Target/R600/SIInsertWaits.cpp
@@ -428,7 +428,11 @@ bool SIInsertWaits::runOnMachineFunction(MachineFunction &MF) {
for (MachineBasicBlock::iterator I = MBB.begin(), E = MBB.end();
I != E; ++I) {
- Changes |= insertWait(MBB, I, handleOperands(*I));
+ // Wait for everything before a barrier.
+ if (I->getOpcode() == AMDGPU::S_BARRIER)
+ Changes |= insertWait(MBB, I, LastIssued);
+ else
+ Changes |= insertWait(MBB, I, handleOperands(*I));
pushInstruction(MBB, I);
}
OpenPOWER on IntegriCloud