diff options
| author | Stanislav Mekhanoshin <Stanislav.Mekhanoshin@amd.com> | 2017-04-06 16:48:30 +0000 | 
|---|---|---|
| committer | Stanislav Mekhanoshin <Stanislav.Mekhanoshin@amd.com> | 2017-04-06 16:48:30 +0000 | 
| commit | ea57c38521d46fe4a8ae2d1172d25538a88d4431 (patch) | |
| tree | f8848ebe196295e32e1b209346c5a78196231ed0 /llvm/lib/Target | |
| parent | 3fc1225c1851a2511bade654751e1ed42dda3653 (diff) | |
| download | bcm5719-llvm-ea57c38521d46fe4a8ae2d1172d25538a88d4431.tar.gz bcm5719-llvm-ea57c38521d46fe4a8ae2d1172d25538a88d4431.zip | |
[AMDGPU] Eliminate barrier if workgroup size is not greater than wavefront size
If a workgroup size is known to be not greater than wavefront size
the s_barrier instruction is not needed since all threads are guarantied
to come to the same point at the same time.
Differential Revision: https://reviews.llvm.org/D31731
llvm-svn: 299659
Diffstat (limited to 'llvm/lib/Target')
| -rw-r--r-- | llvm/lib/Target/AMDGPU/SIISelLowering.cpp | 11 | 
1 files changed, 11 insertions, 0 deletions
| diff --git a/llvm/lib/Target/AMDGPU/SIISelLowering.cpp b/llvm/lib/Target/AMDGPU/SIISelLowering.cpp index 36f16e3ca9a..3052439358a 100644 --- a/llvm/lib/Target/AMDGPU/SIISelLowering.cpp +++ b/llvm/lib/Target/AMDGPU/SIISelLowering.cpp @@ -3159,6 +3159,17 @@ SDValue SITargetLowering::LowerINTRINSIC_VOID(SDValue Op,      SDValue Cast = DAG.getNode(ISD::BITCAST, DL, MVT::i32, Src);      return DAG.getNode(AMDGPUISD::KILL, DL, MVT::Other, Chain, Cast);    } +  case Intrinsic::amdgcn_s_barrier: { +    if (getTargetMachine().getOptLevel() > CodeGenOpt::None) { +      const MachineFunction &MF = DAG.getMachineFunction(); +      const SISubtarget &ST = MF.getSubtarget<SISubtarget>(); +      unsigned WGSize = ST.getFlatWorkGroupSizes(*MF.getFunction()).second; +      if (WGSize <= ST.getWavefrontSize()) +        return SDValue(DAG.getMachineNode(AMDGPU::WAVE_BARRIER, DL, MVT::Other, +                                          Op.getOperand(0)), 0); +    } +    return SDValue(); +  };    default:      return Op;    } | 

