AMDGPU: More bits of frame index are known to be zero

The maximum private allocation for the whole GPU is 4G, so the maximum possible index for a single workitem is the maximum size divided by the smallest granularity for a dispatch. This increases the number of known zero high bits, which enables more offset folding. The maximum private size per workitem with this is 128M but may be smaller still. llvm-svn: 262153
author: Matt Arsenault <Matthew.Arsenault@amd.com> 2016-02-27 20:26:57 +0000
committer: Matt Arsenault <Matthew.Arsenault@amd.com> 2016-02-27 20:26:57 +0000
commit: 3a61985b2fe922ee7c94c0aa148fad046347829d (patch)
tree: 2c8a3a6d5e4450fb7dd03f0535f7d827a210cd4d /llvm/test/CodeGen/AMDGPU/scratch-buffer.ll
parent: d6ebd07b8d1ba5fed46790e0246a2d0716c4b63b (diff)
download: bcm5719-llvm-3a61985b2fe922ee7c94c0aa148fad046347829d.tar.gz
bcm5719-llvm-3a61985b2fe922ee7c94c0aa148fad046347829d.zip
1 files changed, 3 insertions, 6 deletions
diff --git a/llvm/test/CodeGen/AMDGPU/scratch-buffer.ll b/llvm/test/CodeGen/AMDGPU/scratch-buffer.ll
index d43de476605..c992eb817e5 100644
--- a/llvm/test/CodeGen/AMDGPU/scratch-buffer.ll
+++ b/llvm/test/CodeGen/AMDGPU/scratch-buffer.ll
@@ -1,7 +1,5 @@
-; RUN: llc -verify-machineinstrs -march=amdgcn -mcpu=SI < %s | FileCheck --check-prefix=GCN --check-prefix=DEFAULT-SCRATCH %s
-; RUN: llc -verify-machineinstrs -march=amdgcn -mcpu=tonga < %s | FileCheck --check-prefix=GCN --check-prefix=DEFAULT-SCRATCH %s
-; RUN: llc -verify-machineinstrs -march=amdgcn -mattr=+huge-scratch-buffer -mcpu=SI < %s | FileCheck --check-prefix=GCN --check-prefix=HUGE-SCRATCH %s
-; RUN: llc -verify-machineinstrs -march=amdgcn -mattr=+huge-scratch-buffer -mcpu=tonga < %s | FileCheck --check-prefix=GCN --check-prefix=HUGE-SCRATCH %s
+; RUN: llc -verify-machineinstrs -march=amdgcn < %s | FileCheck -check-prefix=GCN %s
+; RUN: llc -verify-machineinstrs -march=amdgcn -mcpu=tonga < %s | FileCheck -check-prefix=GCN %s
 
 ; When a frame index offset is more than 12-bits, make sure we don't store
 ; it in mubuf's offset field.
@@ -102,8 +100,7 @@ entry:
 }
 
 ; GCN-LABEL: @pos_vaddr_offse
-; DEFAULT-SCRATCH: buffer_store_dword v{{[0-9]+}}, v{{[0-9]+}}, s[{{[0-9]+:[0-9]+}}], s{{[0-9]+}} offen offset:16
-; HUGE-SCRATCH: buffer_store_dword v{{[0-9]+}}, v{{[0-9]+}}, s[{{[0-9]+:[0-9]+}}], s{{[0-9]+}} offen{{$}}
+; GCN: buffer_store_dword v{{[0-9]+}}, v{{[0-9]+}}, s[{{[0-9]+:[0-9]+}}], s{{[0-9]+}} offen offset:16
 define void @pos_vaddr_offset(i32 addrspace(1)* %out, i32 %offset) {
 entry:
   %array = alloca [8192 x i32]
author	Matt Arsenault <Matthew.Arsenault@amd.com>	2016-02-27 20:26:57 +0000
committer	Matt Arsenault <Matthew.Arsenault@amd.com>	2016-02-27 20:26:57 +0000
commit	3a61985b2fe922ee7c94c0aa148fad046347829d (patch)
tree	2c8a3a6d5e4450fb7dd03f0535f7d827a210cd4d /llvm/test/CodeGen/AMDGPU/scratch-buffer.ll
parent	d6ebd07b8d1ba5fed46790e0246a2d0716c4b63b (diff)
download	bcm5719-llvm-3a61985b2fe922ee7c94c0aa148fad046347829d.tar.gz bcm5719-llvm-3a61985b2fe922ee7c94c0aa148fad046347829d.zip