summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorMatt Arsenault <Matthew.Arsenault@amd.com>2019-10-30 12:39:55 -0700
committerMatt Arsenault <arsenm2@gmail.com>2019-10-30 14:40:56 -0700
commitedca9ac0de3a5c10a21ef0c725501ea35791006a (patch)
treea142be965cd0a820c3efe2b48df99218f5fc70be
parent0202fa3a47b2eea06d43a6257ebfe5498fb7835b (diff)
downloadbcm5719-llvm-edca9ac0de3a5c10a21ef0c725501ea35791006a.tar.gz
bcm5719-llvm-edca9ac0de3a5c10a21ef0c725501ea35791006a.zip
AMDGPU: Don't fold S_NOPs with implicit operands
-rw-r--r--llvm/lib/Target/AMDGPU/SIShrinkInstructions.cpp4
-rw-r--r--llvm/test/CodeGen/AMDGPU/nop-fold.mir137
2 files changed, 140 insertions, 1 deletions
diff --git a/llvm/lib/Target/AMDGPU/SIShrinkInstructions.cpp b/llvm/lib/Target/AMDGPU/SIShrinkInstructions.cpp
index 8afca2cdc32..3986ca6dfa8 100644
--- a/llvm/lib/Target/AMDGPU/SIShrinkInstructions.cpp
+++ b/llvm/lib/Target/AMDGPU/SIShrinkInstructions.cpp
@@ -603,8 +603,10 @@ bool SIShrinkInstructions::runOnMachineFunction(MachineFunction &MF) {
// =>
// s_nop (N + M)
if (MI.getOpcode() == AMDGPU::S_NOP &&
+ MI.getNumOperands() == 1 && // Don't merge with implicit operands
Next != MBB.end() &&
- (*Next).getOpcode() == AMDGPU::S_NOP) {
+ (*Next).getOpcode() == AMDGPU::S_NOP &&
+ (*Next).getNumOperands() == 1) {
MachineInstr &NextMI = *Next;
// The instruction encodes the amount to wait with an offset of 1,
diff --git a/llvm/test/CodeGen/AMDGPU/nop-fold.mir b/llvm/test/CodeGen/AMDGPU/nop-fold.mir
new file mode 100644
index 00000000000..e014f321280
--- /dev/null
+++ b/llvm/test/CodeGen/AMDGPU/nop-fold.mir
@@ -0,0 +1,137 @@
+# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
+# RUN: llc --mtriple=amdgcn--amdhsa -mcpu=fiji -run-pass=si-shrink-instructions %s -o - | FileCheck %s
+
+---
+
+name: merge_2_nop
+tracksRegLiveness: true
+body: |
+ bb.0:
+
+ ; CHECK-LABEL: name: merge_2_nop
+ ; CHECK: S_NOP 1
+ S_NOP 0
+ S_NOP 0
+
+...
+
+---
+
+name: merge_3_nop
+tracksRegLiveness: true
+body: |
+ bb.0:
+
+ ; CHECK-LABEL: name: merge_3_nop
+ ; CHECK: S_NOP 2
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+
+
+...
+
+---
+
+name: merge_7_nop
+tracksRegLiveness: true
+body: |
+ bb.0:
+
+ ; CHECK-LABEL: name: merge_7_nop
+ ; CHECK: S_NOP 6
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+
+...
+
+---
+
+name: merge_8_nop
+tracksRegLiveness: true
+body: |
+ bb.0:
+
+ ; CHECK-LABEL: name: merge_8_nop
+ ; CHECK: S_NOP 7
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+
+...
+---
+
+name: merge_9_nop
+tracksRegLiveness: true
+body: |
+ bb.0:
+
+ ; CHECK-LABEL: name: merge_9_nop
+ ; CHECK: S_NOP 7
+ ; CHECK: S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+ S_NOP 0
+
+...
+
+---
+
+name: no_merge_impdef0
+tracksRegLiveness: true
+body: |
+ bb.0:
+
+ ; CHECK-LABEL: name: no_merge_impdef0
+ ; CHECK: S_NOP 0, implicit-def $sgpr0
+ ; CHECK: S_NOP 0
+ S_NOP 0, implicit-def $sgpr0
+ S_NOP 0
+
+...
+
+---
+
+name: no_merge_impdef1
+tracksRegLiveness: true
+body: |
+ bb.0:
+
+ ; CHECK-LABEL: name: no_merge_impdef1
+ ; CHECK: S_NOP 0
+ ; CHECK: S_NOP 0, implicit-def $sgpr0
+ S_NOP 0
+ S_NOP 0, implicit-def $sgpr0
+
+...
+
+---
+
+name: no_merge_impdef_both
+tracksRegLiveness: true
+body: |
+ bb.0:
+
+ ; CHECK-LABEL: name: no_merge_impdef_both
+ ; CHECK: S_NOP 0
+ ; CHECK: S_NOP 0, implicit-def $sgpr0
+ S_NOP 0
+ S_NOP 0, implicit-def $sgpr0
+
+...
OpenPOWER on IntegriCloud