summary | refs | log | tree | commit | diff | stats
path: root/llvm/test/CodeGen/AMDGPU/extload-align.ll
diff options
context:
space:
mode:
author Matt Arsenault <Matthew.Arsenault@amd.com> 2018-05-16 11:47:30 +0000
committer Matt Arsenault <Matthew.Arsenault@amd.com> 2018-05-16 11:47:30 +0000
commit 67a9815a5c9d0355020e17c0a494f7eaa1df21fe (patch)
tree 3422ea805c0a69f22bcdec55e8c684b282498b59 /llvm/test/CodeGen/AMDGPU/extload-align.ll
parent ca22d427b94de946d4ef32b8acbdfb7e62e7cfa4 (diff)
download bcm5719-llvm-67a9815a5c9d0355020e17c0a494f7eaa1df21fe.tar.gz
bcm5719-llvm-67a9815a5c9d0355020e17c0a494f7eaa1df21fe.zip
AMDGPU: Custom lower v4i16/v4f16 vector operations
Avoids stack access. Also handle extract hi elt pattern from truncate + shift to avoid a couple test regressions. llvm-svn: 332453
Diffstat (limited to 'llvm/test/CodeGen/AMDGPU/extload-align.ll')
-rw-r--r-- llvm/test/CodeGen/AMDGPU/extload-align.ll 8
1 file changed, 4 insertions, 4 deletions
diff --git a/llvm/test/CodeGen/AMDGPU/extload-align.ll b/llvm/test/CodeGen/AMDGPU/extload-align.ll
index ed6890e5c82..aa80ee4f64f 100644
--- a/llvm/test/CodeGen/AMDGPU/extload-align.ll
+++ b/llvm/test/CodeGen/AMDGPU/extload-align.ll
@@ -7,17 +7,17 @@ target datalayout = "A5"
; size and not 4 corresponding to the sign-extended size (i32).
; DEBUG: {{^}}# Machine code for function extload_align:
-; DEBUG: (load 2, addrspace 5)
+; DEBUG: (volatile load 2 from %ir.a, addrspace 5)
; DEBUG: {{^}}# End machine code for function extload_align.
define amdgpu_kernel void @extload_align(i32 addrspace(5)* %out, i32 %index) #0 {
%v0 = alloca [4 x i16], addrspace(5)
%a1 = getelementptr inbounds [4 x i16], [4 x i16] addrspace(5)* %v0, i32 0, i32 0
%a2 = getelementptr inbounds [4 x i16], [4 x i16] addrspace(5)* %v0, i32 0, i32 1
- store i16 0, i16 addrspace(5)* %a1
- store i16 1, i16 addrspace(5)* %a2
+ store volatile i16 0, i16 addrspace(5)* %a1
+ store volatile i16 1, i16 addrspace(5)* %a2
%a = getelementptr inbounds [4 x i16], [4 x i16] addrspace(5)* %v0, i32 0, i32 %index
- %val = load i16, i16 addrspace(5)* %a
+ %val = load volatile i16, i16 addrspace(5)* %a
%eval = sext i16 %val to i32
store i32 %eval, i32 addrspace(5)* %out
ret void
OpenPOWER on IntegriCloud