summary | refs | log | tree | commit | diff | stats
path: root/llvm/lib/Target/AMDGPU/SIISelLowering.cpp
diff options
context:
space:
mode:
author: Stanislav Mekhanoshin <Stanislav.Mekhanoshin@amd.com> 2018-02-14 18:05:14 +0000
committer: Stanislav Mekhanoshin <Stanislav.Mekhanoshin@amd.com> 2018-02-14 18:05:14 +0000
commit: c078ca92ebe20fd497d9da68bc4b99fd2163f097 (patch)
tree: 9424d7cbb2a4082618f6a115692da78d0af196bf /llvm/lib/Target/AMDGPU/SIISelLowering.cpp
parent: cbecfdfefe11ddc11f9c8efbe894c39d64d74f09 (diff)
download: bcm5719-llvm-c078ca92ebe20fd497d9da68bc4b99fd2163f097.tar.gz
bcm5719-llvm-c078ca92ebe20fd497d9da68bc4b99fd2163f097.zip
[AMDGPU] Remove non-temporal flag from argument loads
Kernel arguments are likely read by all workitems and should not bypass the cache. Fixes a performance hit in sub-dword argument loads. Differential Revision: https://reviews.llvm.org/D43249 llvm-svn: 325146
Diffstat (limited to 'llvm/lib/Target/AMDGPU/SIISelLowering.cpp')
-rw-r--r-- llvm/lib/Target/AMDGPU/SIISelLowering.cpp 1
1 files changed, 0 insertions, 1 deletions
diff --git a/llvm/lib/Target/AMDGPU/SIISelLowering.cpp b/llvm/lib/Target/AMDGPU/SIISelLowering.cpp
index 0bda70daf08..a0b7a012c5a 100644
--- a/llvm/lib/Target/AMDGPU/SIISelLowering.cpp
+++ b/llvm/lib/Target/AMDGPU/SIISelLowering.cpp
@@ -1205,7 +1205,6 @@ SDValue SITargetLowering::lowerKernargMemParameter(
SDValue Ptr = lowerKernArgParameterPtr(DAG, SL, Chain, Offset);
SDValue Load = DAG.getLoad(MemVT, SL, Chain, Ptr, PtrInfo, Align,
- MachineMemOperand::MONonTemporal |
MachineMemOperand::MODereferenceable |
MachineMemOperand::MOInvariant);
OpenPOWER on IntegriCloud