diff options
author | Tom Stellard <thomas.stellard@amd.com> | 2015-01-06 19:52:07 +0000 |
---|---|---|
committer | Tom Stellard <thomas.stellard@amd.com> | 2015-01-06 19:52:07 +0000 |
commit | 9d6797ae5804e4bf9a0a760d136d4b6a28b47b83 (patch) | |
tree | faf88ff2b7d22e68157bc65910ef800d64e69c74 /llvm | |
parent | b3931b814adc8a6c3d6b8b1d6a2a0faa6d4cdc52 (diff) | |
download | bcm5719-llvm-9d6797ae5804e4bf9a0a760d136d4b6a28b47b83.tar.gz bcm5719-llvm-9d6797ae5804e4bf9a0a760d136d4b6a28b47b83.zip |
R600/SI: Insert s_waitcnt before s_barrier instructions.
This ensures that all memory operations are complete when all threads
reach the barrier.
llvm-svn: 225290
Diffstat (limited to 'llvm')
-rw-r--r-- | llvm/lib/Target/R600/SIInsertWaits.cpp | 6 | ||||
-rw-r--r-- | llvm/test/CodeGen/R600/llvm.AMDGPU.barrier.global.ll | 2 | ||||
-rw-r--r-- | llvm/test/CodeGen/R600/llvm.AMDGPU.barrier.local.ll | 3 |
3 files changed, 10 insertions, 1 deletion
```diff
diff --git a/llvm/lib/Target/R600/SIInsertWaits.cpp b/llvm/lib/Target/R600/SIInsertWaits.cpp
index 2e56508e2fa..181b11643bf 100644
--- a/llvm/lib/Target/R600/SIInsertWaits.cpp
+++ b/llvm/lib/Target/R600/SIInsertWaits.cpp
@@ -428,7 +428,11 @@ bool SIInsertWaits::runOnMachineFunction(MachineFunction &MF) {
     for (MachineBasicBlock::iterator I = MBB.begin(), E = MBB.end();
          I != E; ++I) {
 
-      Changes |= insertWait(MBB, I, handleOperands(*I));
+      // Wait for everything before a barrier.
+      if (I->getOpcode() == AMDGPU::S_BARRIER)
+        Changes |= insertWait(MBB, I, LastIssued);
+      else
+        Changes |= insertWait(MBB, I, handleOperands(*I));
       pushInstruction(MBB, I);
     }
 
diff --git a/llvm/test/CodeGen/R600/llvm.AMDGPU.barrier.global.ll b/llvm/test/CodeGen/R600/llvm.AMDGPU.barrier.global.ll
index 31e170948a0..a11d9ae7af0 100644
--- a/llvm/test/CodeGen/R600/llvm.AMDGPU.barrier.global.ll
+++ b/llvm/test/CodeGen/R600/llvm.AMDGPU.barrier.global.ll
@@ -3,6 +3,8 @@
 
 ; FUNC-LABEL: {{^}}test_barrier_global:
 ; EG: GROUP_BARRIER
+; SI: buffer_store_dword
+; SI: s_waitcnt
 ; SI: s_barrier
 
 define void @test_barrier_global(i32 addrspace(1)* %out) {
diff --git a/llvm/test/CodeGen/R600/llvm.AMDGPU.barrier.local.ll b/llvm/test/CodeGen/R600/llvm.AMDGPU.barrier.local.ll
index 94b3cbc86eb..76c2453d089 100644
--- a/llvm/test/CodeGen/R600/llvm.AMDGPU.barrier.local.ll
+++ b/llvm/test/CodeGen/R600/llvm.AMDGPU.barrier.local.ll
@@ -3,6 +3,9 @@
 
 ; FUNC-LABEL: {{^}}test_barrier_local:
 ; EG: GROUP_BARRIER
+
+; SI: buffer_store_dword
+; SI: s_waitcnt
 ; SI: s_barrier
 
 define void @test_barrier_local(i32 addrspace(1)* %out) {
```