summaryrefslogtreecommitdiffstats
path: root/llvm/test/Transforms/EarlyCSE
diff options
context:
space:
mode:
authorMatt Arsenault <Matthew.Arsenault@amd.com>2019-02-25 20:16:11 +0000
committerMatt Arsenault <Matthew.Arsenault@amd.com>2019-02-25 20:16:11 +0000
commitf97ace5639863bde1eb4cc9081d191896657b56b (patch)
tree650289c852732ff29ddd2c1de2dcfbf28ac2650c /llvm/test/Transforms/EarlyCSE
parent84b3288853aaf54295c7493a439473407262ec16 (diff)
downloadbcm5719-llvm-f97ace5639863bde1eb4cc9081d191896657b56b.tar.gz
bcm5719-llvm-f97ace5639863bde1eb4cc9081d191896657b56b.zip
AMDGPU: Remove IntrReadMem from memtime/memrealtime intrinsics
EarlyCSE with MemorySSA was able to use this to merge multiple calls with no intervening store. llvm-svn: 354814
Diffstat (limited to 'llvm/test/Transforms/EarlyCSE')
-rw-r--r--llvm/test/Transforms/EarlyCSE/AMDGPU/lit.local.cfg5
-rw-r--r--llvm/test/Transforms/EarlyCSE/AMDGPU/memrealtime.ll43
2 files changed, 48 insertions, 0 deletions
diff --git a/llvm/test/Transforms/EarlyCSE/AMDGPU/lit.local.cfg b/llvm/test/Transforms/EarlyCSE/AMDGPU/lit.local.cfg
new file mode 100644
index 00000000000..4536d089640
--- /dev/null
+++ b/llvm/test/Transforms/EarlyCSE/AMDGPU/lit.local.cfg
@@ -0,0 +1,5 @@
+config.suffixes = ['.ll']
+
+targets = set(config.root.targets_to_build.split())
+if not 'AMDGPU' in targets:
+ config.unsupported = True
diff --git a/llvm/test/Transforms/EarlyCSE/AMDGPU/memrealtime.ll b/llvm/test/Transforms/EarlyCSE/AMDGPU/memrealtime.ll
new file mode 100644
index 00000000000..6b42ee8d71e
--- /dev/null
+++ b/llvm/test/Transforms/EarlyCSE/AMDGPU/memrealtime.ll
@@ -0,0 +1,43 @@
+; RUN: opt -S -mtriple=amdgcn-amd-amdhsa -early-cse-memssa < %s | FileCheck %s
+target datalayout = "e-p:64:64-p1:64:64-p2:32:32-p3:32:32-p4:64:64-p5:32:32-p6:32:32-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64-S32-A5"
+
+; CHECK-LABEL: @memrealtime(
+; CHECK: call i64 @llvm.amdgcn.s.memrealtime()
+; CHECK: call i64 @llvm.amdgcn.s.memrealtime()
+define amdgpu_kernel void @memrealtime(i64 %cycles) #0 {
+entry:
+ %0 = tail call i64 @llvm.amdgcn.s.memrealtime()
+ %cmp3 = icmp sgt i64 %cycles, 0
+ br i1 %cmp3, label %while.body, label %while.end
+
+while.body:
+ %1 = tail call i64 @llvm.amdgcn.s.memrealtime()
+ %sub = sub nsw i64 %1, %0
+ %cmp = icmp slt i64 %sub, %cycles
+ br i1 %cmp, label %while.body, label %while.end
+
+while.end:
+ ret void
+}
+
+; CHECK-LABEL: @memtime(
+; CHECK: call i64 @llvm.amdgcn.s.memtime()
+; CHECK: call i64 @llvm.amdgcn.s.memtime()
+define amdgpu_kernel void @memtime(i64 %cycles) #0 {
+entry:
+ %0 = tail call i64 @llvm.amdgcn.s.memtime()
+ %cmp3 = icmp sgt i64 %cycles, 0
+ br i1 %cmp3, label %while.body, label %while.end
+
+while.body:
+ %1 = tail call i64 @llvm.amdgcn.s.memtime()
+ %sub = sub nsw i64 %1, %0
+ %cmp = icmp slt i64 %sub, %cycles
+ br i1 %cmp, label %while.body, label %while.end
+
+while.end:
+ ret void
+}
+
+declare i64 @llvm.amdgcn.s.memrealtime()
+declare i64 @llvm.amdgcn.s.memtime()
OpenPOWER on IntegriCloud