summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp3
-rw-r--r--llvm/test/CodeGen/AMDGPU/lcssa-optnone.ll26
2 files changed, 29 insertions, 0 deletions
diff --git a/llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp b/llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp
index 0ea8db04c29..5f0c6a7c5f0 100644
--- a/llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp
+++ b/llvm/lib/Target/AMDGPU/AMDGPUTargetMachine.cpp
@@ -882,6 +882,9 @@ bool GCNPassConfig::addInstSelector() {
addPass(createSILowerI1CopiesPass());
addPass(createSIFixupVectorISelPass());
addPass(createSIAddIMGInitPass());
+ // FIXME: Remove this once the phi on CF_END is cleaned up, either by removing
+ // LCSSA or by some other means.
+ addPass(&UnreachableMachineBlockElimID);
return false;
}
diff --git a/llvm/test/CodeGen/AMDGPU/lcssa-optnone.ll b/llvm/test/CodeGen/AMDGPU/lcssa-optnone.ll
new file mode 100644
index 00000000000..bda1412cbeb
--- /dev/null
+++ b/llvm/test/CodeGen/AMDGPU/lcssa-optnone.ll
@@ -0,0 +1,26 @@
+; RUN: llc -march=amdgcn -O0 -o - %s | FileCheck %s
+
+; CHECK-LABEL: non_uniform_loop
+; CHECK: s_endpgm
+define amdgpu_kernel void @non_uniform_loop(float addrspace(1)* %array) { ; kernel holding one empty counted loop bounded by %w; %array is never referenced
+entry:
+ %w = tail call i32 @llvm.amdgcn.workitem.id.x() ; loop bound: value returned by the workitem.id.x intrinsic
+ br label %for.cond
+
+for.cond: ; loop header
+ %i = phi i32 [0, %entry], [%i.next, %for.inc] ; induction variable: 0 from entry, %i.next along the back edge
+ %cmp = icmp ult i32 %i, %w ; unsigned compare: stay in the loop while %i < %w
+ br i1 %cmp, label %for.body, label %for.end
+
+for.body: ; body does no work, it only falls through to the increment
+ br label %for.inc
+
+for.inc:
+ %i.next = add i32 %i, 1 ; advance the induction variable by one
+ br label %for.cond ; back edge to the loop header
+
+for.end: ; loop exit
+ ret void
+}
+
+declare i32 @llvm.amdgcn.workitem.id.x()
OpenPOWER on IntegriCloud