summaryrefslogtreecommitdiffstats
path: root/llvm
diff options
context:
space:
mode:
authorDavid Green <david.green@arm.com>2018-06-21 08:30:07 +0000
committerDavid Green <david.green@arm.com>2018-06-21 08:30:07 +0000
commita465188500672de18918b8c5c36366622429a5ce (patch)
tree4f9ccfefc82e390c88ccfefebfaa7229f1aaea91 /llvm
parentaefd73e1b51d11ec92b0ccb69c5cfc8b8d782799 (diff)
downloadbcm5719-llvm-a465188500672de18918b8c5c36366622429a5ce.tar.gz
bcm5719-llvm-a465188500672de18918b8c5c36366622429a5ce.zip
[DAGCombine] Fix alignment for offset loads/stores
The alignment parameter to getExtLoad is treated as a base alignment, not the alignment of the load (base + offset). When we infer a better alignment for a Ptr we need to ensure that it applies to the base to prevent the alignment on the load from being wrong. This fixes a bug where the alignment could then be used to incorrectly prove noalias between a load and a store, leading to a miscompile. Differential Revision: https://reviews.llvm.org/D48029 llvm-svn: 335210
Diffstat (limited to 'llvm')
-rw-r--r--llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp14
-rw-r--r--llvm/test/CodeGen/ARM/alias_align.ll25
2 files changed, 33 insertions, 6 deletions
diff --git a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
index b29006c9967..22d55a1a0ef 100644
--- a/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
+++ b/llvm/lib/CodeGen/SelectionDAG/DAGCombiner.cpp
@@ -12231,13 +12231,14 @@ SDValue DAGCombiner::visitLOAD(SDNode *N) {
// Try to infer better alignment information than the load already has.
if (OptLevel != CodeGenOpt::None && LD->isUnindexed()) {
if (unsigned Align = DAG.InferPtrAlignment(Ptr)) {
- if (Align > LD->getMemOperand()->getBaseAlignment()) {
+ if (Align > LD->getAlignment() && LD->getSrcValueOffset() % Align == 0) {
SDValue NewLoad = DAG.getExtLoad(
LD->getExtensionType(), SDLoc(N), LD->getValueType(0), Chain, Ptr,
LD->getPointerInfo(), LD->getMemoryVT(), Align,
LD->getMemOperand()->getFlags(), LD->getAAInfo());
- if (NewLoad.getNode() != N)
- return CombineTo(N, NewLoad, SDValue(NewLoad.getNode(), 1), true);
+ // NewLoad will always be N as we are only refining the alignment
+ assert(NewLoad.getNode() == N);
+ (void)NewLoad;
}
}
}
@@ -14238,13 +14239,14 @@ SDValue DAGCombiner::visitSTORE(SDNode *N) {
// Try to infer better alignment information than the store already has.
if (OptLevel != CodeGenOpt::None && ST->isUnindexed()) {
if (unsigned Align = DAG.InferPtrAlignment(Ptr)) {
- if (Align > ST->getAlignment()) {
+ if (Align > ST->getAlignment() && ST->getSrcValueOffset() % Align == 0) {
SDValue NewStore =
DAG.getTruncStore(Chain, SDLoc(N), Value, Ptr, ST->getPointerInfo(),
ST->getMemoryVT(), Align,
ST->getMemOperand()->getFlags(), ST->getAAInfo());
- if (NewStore.getNode() != N)
- return CombineTo(ST, NewStore, true);
+ // NewStore will always be N as we are only refining the alignment
+ assert(NewStore.getNode() == N);
+ (void)NewStore;
}
}
}
diff --git a/llvm/test/CodeGen/ARM/alias_align.ll b/llvm/test/CodeGen/ARM/alias_align.ll
new file mode 100644
index 00000000000..452dfefbfcc
--- /dev/null
+++ b/llvm/test/CodeGen/ARM/alias_align.ll
@@ -0,0 +1,25 @@
+; RUN: llc < %s | FileCheck %s
+
+target datalayout = "e-m:e-p:32:32-i64:64-v128:64:128-a:0:32-n32-S64"
+target triple = "armv8-arm-none-eabi"
+
+; Check the loads happen after the stores (note: directly returning 0 is also valid)
+; CHECK-LABEL: somesortofhash
+; CHECK-NOT: ldr
+; CHECK: str
+
+define i64 @somesortofhash() {
+entry:
+ %helper = alloca i8, i32 64, align 8
+ %helper.0.4x32 = bitcast i8* %helper to <4 x i32>*
+ %helper.20 = getelementptr inbounds i8, i8* %helper, i32 20
+ %helper.24 = getelementptr inbounds i8, i8* %helper, i32 24
+ store <4 x i32> zeroinitializer, <4 x i32>* %helper.0.4x32, align 8
+ %helper.20.32 = bitcast i8* %helper.20 to i32*
+ %helper.24.32 = bitcast i8* %helper.24 to i32*
+ store i32 0, i32* %helper.20.32
+ store i32 0, i32* %helper.24.32, align 8
+ %helper.20.64 = bitcast i8* %helper.20 to i64*
+ %load.helper.20.64 = load i64, i64* %helper.20.64, align 4
+ ret i64 %load.helper.20.64
+}
OpenPOWER on IntegriCloud