diff options
Diffstat (limited to 'llvm/test/CodeGen/AMDGPU/wave32.ll')
-rw-r--r-- | llvm/test/CodeGen/AMDGPU/wave32.ll | 29 |
1 file changed, 23 insertions, 6 deletions
diff --git a/llvm/test/CodeGen/AMDGPU/wave32.ll b/llvm/test/CodeGen/AMDGPU/wave32.ll
index 85c79144d0e..91a99318197 100644
--- a/llvm/test/CodeGen/AMDGPU/wave32.ll
+++ b/llvm/test/CodeGen/AMDGPU/wave32.ll
@@ -232,14 +232,31 @@ bb13:
 ; GCN: s_cbranch_execz
 ; GCN: BB{{.*}}:
 ; GCN: BB{{.*}}:
-; GFX1032: s_andn2_b32 s{{[0-9]+}}, s{{[0-9]+}}, exec_lo
-; GFX1064: s_andn2_b64 s[{{[0-9:]+}}], s[{{[0-9:]+}}], exec
-; GFX1032: s_or_b32 s{{[0-9]+}}, vcc_lo, s{{[0-9]+}}
-; GFX1032: s_or_b32 s{{[0-9]+}}, s{{[0-9]+}}, s{{[0-9]+}}
-; GFX1064: s_or_b64 s[{{[0-9:]+}}], vcc, s[{{[0-9:]+}}]
-; GFX1064: s_or_b64 s[{{[0-9:]+}}], s[{{[0-9:]+}}], s[{{[0-9:]+}}]
+
+; GFX1032: s_or_b32 [[MASK0:s[0-9]+]], [[MASK0]], vcc_lo
+; GFX1064: s_or_b64 [[MASK0:s\[[0-9:]+\]]], [[MASK0]], vcc
+; GFX1032: s_andn2_b32 [[MASK1:s[0-9]+]], [[MASK1]], exec_lo
+; GFX1064: s_andn2_b64 [[MASK1:s\[[0-9:]+\]]], [[MASK1]], exec
+; GCN: global_store_dword
+; GFX1032: s_and_b32 [[MASK0]], [[MASK0]], exec_lo
+; GFX1064: s_and_b64 [[MASK0]], [[MASK0]], exec
+; GFX1032: s_or_b32 [[MASK1]], [[MASK1]], [[MASK0]]
+; GFX1064: s_or_b64 [[MASK1]], [[MASK1]], [[MASK0]]
+; GCN: BB{{.*}}: ; %Flow
+; GFX1032: s_and_b32 [[MASK0:s[0-9]+]], exec_lo, [[MASK1]]
+; GFX1064: s_and_b64 [[MASK0:s\[[0-9:]+\]]], exec, [[MASK1]]
+; GFX1032: s_or_b32 [[MASK0]], [[MASK0]], [[ACC:s[0-9]+]]
+; GFX1064: s_or_b64 [[MASK0]], [[MASK0]], [[ACC:s\[[0-9:]+\]]]
+; GFX1032: s_mov_b32 [[ACC]], [[MASK0]]
+; GFX1064: s_mov_b64 [[ACC]], [[MASK0]]
+; GFX1032: s_andn2_b32 exec_lo, exec_lo, [[MASK0]]
+; GFX1064: s_andn2_b64 exec, exec, [[MASK0]]
 ; GCN: s_cbranch_execz
 ; GCN: BB{{.*}}:
+; GCN: s_load_dword [[LOAD:s[0-9]+]]
+; GFX1032: s_or_b32 [[MASK1]], [[MASK1]], exec_lo
+; GFX1064: s_or_b64 [[MASK1]], [[MASK1]], exec
+; GCN: s_cmp_lt_i32 [[LOAD]], 11
 define amdgpu_kernel void @test_loop_with_if_else_break(i32 addrspace(1)* %arg) #0 {
 bb:
   %tmp = tail call i32 @llvm.amdgcn.workitem.id.x()