diff options
Diffstat (limited to 'llvm/test/CodeGen/AMDGPU/or.ll')
-rw-r--r-- | llvm/test/CodeGen/AMDGPU/or.ll | 102 |
1 files changed, 99 insertions, 3 deletions
diff --git a/llvm/test/CodeGen/AMDGPU/or.ll b/llvm/test/CodeGen/AMDGPU/or.ll index 56f54cf7c5e..3e254850a93 100644 --- a/llvm/test/CodeGen/AMDGPU/or.ll +++ b/llvm/test/CodeGen/AMDGPU/or.ll @@ -1,5 +1,5 @@ -; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s ; RUN: llc -march=amdgcn -mcpu=verde -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s +; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s ; RUN: llc -march=r600 -mcpu=redwood < %s | FileCheck -check-prefix=EG -check-prefix=FUNC %s @@ -62,6 +62,75 @@ define void @scalar_or_literal_i32(i32 addrspace(1)* %out, i32 %a) { ret void } +; FUNC-LABEL: {{^}}scalar_or_literal_i64: +; SI: s_load_dwordx2 s{{\[}}[[LO:[0-9]+]]:[[HI:[0-9]+]]{{\]}}, s{{\[[0-9]+:[0-9]+\]}}, {{0xb|0x2c}} +; SI-DAG: s_or_b32 s[[RES_HI:[0-9]+]], s[[HI]], 0xf237b +; SI-DAG: s_or_b32 s[[RES_LO:[0-9]+]], s[[LO]], 0x3039 +; SI-DAG: v_mov_b32_e32 v{{[0-9]+}}, s[[RES_LO]] +; SI-DAG: v_mov_b32_e32 v{{[0-9]+}}, s[[RES_HI]] +define void @scalar_or_literal_i64(i64 addrspace(1)* %out, i64 %a) { + %or = or i64 %a, 4261135838621753 + store i64 %or, i64 addrspace(1)* %out + ret void +} + +; FUNC-LABEL: {{^}}scalar_or_literal_multi_use_i64: +; SI: s_load_dwordx2 s{{\[}}[[LO:[0-9]+]]:[[HI:[0-9]+]]{{\]}}, s{{\[[0-9]+:[0-9]+\]}}, {{0xb|0x2c}} +; SI-DAG: s_mov_b32 s[[K_HI:[0-9]+]], 0xf237b +; SI-DAG: s_movk_i32 s[[K_LO:[0-9]+]], 0x3039 +; SI: s_or_b64 s{{\[[0-9]+:[0-9]+\]}}, s{{\[[0-9]+:[0-9]+\]}}, s{{\[}}[[K_LO]]:[[K_HI]]{{\]}} + +; SI: s_add_u32 s{{[0-9]+}}, s{{[0-9]+}}, s[[K_LO]] +; SI: s_addc_u32 s{{[0-9]+}}, s{{[0-9]+}}, s[[K_HI]] +define void @scalar_or_literal_multi_use_i64(i64 addrspace(1)* %out, i64 %a, i64 %b) { + %or = or i64 %a, 4261135838621753 + store i64 %or, i64 addrspace(1)* %out + + %foo = add i64 %b, 4261135838621753 + store volatile i64 %foo, i64 addrspace(1)* undef + ret void +} + +; FUNC-LABEL: {{^}}scalar_or_inline_imm_i64: +; SI: s_load_dwordx2 s{{\[}}[[VAL_LO:[0-9]+]]:[[VAL_HI:[0-9]+]]{{\]}}, s{{\[[0-9]+:[0-9]+\]}}, {{0xb|0x2c}} +; SI-NOT: or_b32 +; SI: s_or_b32 s[[VAL_LO]], s[[VAL_LO]], 63 +; SI-NOT: or_b32 +; SI: v_mov_b32_e32 v[[VLO:[0-9]+]], s[[VAL_LO]] +; SI-NOT: or_b32 +; SI: v_mov_b32_e32 v[[VHI:[0-9]+]], s[[VAL_HI]] +; SI-NOT: or_b32 +; SI: buffer_store_dwordx2 v{{\[}}[[VLO]]:[[VHI]]{{\]}} +define void @scalar_or_inline_imm_i64(i64 addrspace(1)* %out, i64 %a) { + %or = or i64 %a, 63 + store i64 %or, i64 addrspace(1)* %out + ret void +} + +; FUNC-LABEL: {{^}}scalar_or_inline_imm_multi_use_i64: +; SI-NOT: or_b32 +; SI: s_or_b32 s{{[0-9]+}}, s{{[0-9]+}}, 63 +; SI-NOT: or_b32 +define void @scalar_or_inline_imm_multi_use_i64(i64 addrspace(1)* %out, i64 %a, i64 %b) { + %or = or i64 %a, 63 + store i64 %or, i64 addrspace(1)* %out + %foo = add i64 %b, 63 + store volatile i64 %foo, i64 addrspace(1)* undef + ret void +} + +; FUNC-LABEL: {{^}}scalar_or_neg_inline_imm_i64: +; SI-DAG: s_load_dword [[VAL:s[0-9]+]] +; SI-DAG: s_or_b32 [[VAL]], [[VAL]], -8 +; SI-DAG: v_mov_b32_e32 v[[V_HI:[0-9]+]], -1{{$}} +; SI-DAG: v_mov_b32_e32 v[[V_LO:[0-9]+]], [[VAL]] +; SI: buffer_store_dwordx2 v{{\[}}[[V_LO]]:[[V_HI]]{{\]}} +define void @scalar_or_neg_inline_imm_i64(i64 addrspace(1)* %out, i64 %a) { + %or = or i64 %a, -8 + store i64 %or, i64 addrspace(1)* %out + ret void +} + ; FUNC-LABEL: {{^}}vector_or_literal_i32: ; SI: v_or_b32_e32 v{{[0-9]+}}, 0xffff, v{{[0-9]+}} define void @vector_or_literal_i32(i32 addrspace(1)* %out, i32 addrspace(1)* %a, i32 addrspace(1)* %b) { @@ -127,8 +196,9 @@ define void @vector_or_i64_loadimm(i64 addrspace(1)* %out, i64 addrspace(1)* %a, ; FIXME: The or 0 should really be removed. ; FUNC-LABEL: {{^}}vector_or_i64_imm: ; SI: buffer_load_dwordx2 v{{\[}}[[LO_VREG:[0-9]+]]:[[HI_VREG:[0-9]+]]{{\]}}, -; SI: v_or_b32_e32 {{v[0-9]+}}, 8, v[[LO_VREG]] -; SI: v_or_b32_e32 {{v[0-9]+}}, 0, {{.*}} +; SI: v_or_b32_e32 v[[LO_RESULT:[0-9]+]], 8, v[[LO_VREG]] +; SI-NOT: v_or_b32_e32 {{v[0-9]+}}, 0 +; SI: buffer_store_dwordx2 v{{\[}}[[LO_RESULT]]:[[HI_VREG]]{{\]}} ; SI: s_endpgm define void @vector_or_i64_imm(i64 addrspace(1)* %out, i64 addrspace(1)* %a, i64 addrspace(1)* %b) { %loada = load i64, i64 addrspace(1)* %a, align 8 @@ -137,6 +207,32 @@ define void @vector_or_i64_imm(i64 addrspace(1)* %out, i64 addrspace(1)* %a, i64 ret void } +; FUNC-LABEL: {{^}}vector_or_i64_neg_inline_imm: +; SI-DAG: buffer_load_dword v[[LO_VREG:[0-9]+]] +; SI-DAG: v_or_b32_e32 v[[RES_LO:[0-9]+]], -8, v[[LO_VREG]] +; SI-DAG: v_mov_b32_e32 v[[RES_HI:[0-9]+]], -1{{$}} +; SI: buffer_store_dwordx2 v{{\[}}[[RES_LO]]:[[RES_HI]]{{\]}} +; SI: s_endpgm +define void @vector_or_i64_neg_inline_imm(i64 addrspace(1)* %out, i64 addrspace(1)* %a, i64 addrspace(1)* %b) { + %loada = load i64, i64 addrspace(1)* %a, align 8 + %or = or i64 %loada, -8 + store i64 %or, i64 addrspace(1)* %out + ret void +} + +; FUNC-LABEL: {{^}}vector_or_i64_neg_literal: +; SI-DAG: buffer_load_dword v[[LO_VREG:[0-9]+]] +; SI-DAG: v_mov_b32_e32 v{{[0-9]+}}, -1{{$}} +; SI-DAG: v_or_b32_e32 {{v[0-9]+}}, 0xffffff38, v[[LO_VREG]] +; SI: buffer_store_dwordx2 +; SI: s_endpgm +define void @vector_or_i64_neg_literal(i64 addrspace(1)* %out, i64 addrspace(1)* %a, i64 addrspace(1)* %b) { + %loada = load i64, i64 addrspace(1)* %a, align 8 + %or = or i64 %loada, -200 + store i64 %or, i64 addrspace(1)* %out + ret void +} + ; FUNC-LABEL: {{^}}trunc_i64_or_to_i32: ; SI: s_load_dword s[[SREG0:[0-9]+]] ; SI: s_load_dword s[[SREG1:[0-9]+]] |