diff options
author | Tom Stellard <thomas.stellard@amd.com> | 2016-02-13 02:09:49 +0000 |
---|---|---|
committer | Tom Stellard <thomas.stellard@amd.com> | 2016-02-13 02:09:49 +0000 |
commit | 4409051d00a6b053354c93e28880c24aa00d598c (patch) | |
tree | ac8e4f0a30ac241a1fc8e30c687c974bcc77a401 | |
parent | 7c7c3e35911f7f7c1709cac05b1d27ce19db5ab5 (diff) | |
download | bcm5719-llvm-4409051d00a6b053354c93e28880c24aa00d598c.tar.gz bcm5719-llvm-4409051d00a6b053354c93e28880c24aa00d598c.zip |
AMDGPU/SI: Add llvm.amdgcn.mov.dpp intrinsic
This intrinsic will be used to expose dpp functionality to higher-level
languages. It will map to the dpp version of v_mov_b32.
llvm-svn: 260792
-rw-r--r-- | llvm/include/llvm/IR/IntrinsicsAMDGPU.td | 6 | ||||
-rw-r--r-- | llvm/lib/Target/AMDGPU/VIInstructions.td | 11 | ||||
-rw-r--r-- | llvm/test/CodeGen/AMDGPU/llvm.amdgcn.mov.dpp.ll | 13 |
3 files changed, 30 insertions, 0 deletions
diff --git a/llvm/include/llvm/IR/IntrinsicsAMDGPU.td b/llvm/include/llvm/IR/IntrinsicsAMDGPU.td index d2e76b449e0..ef3c24080b8 100644 --- a/llvm/include/llvm/IR/IntrinsicsAMDGPU.td +++ b/llvm/include/llvm/IR/IntrinsicsAMDGPU.td @@ -203,6 +203,12 @@ def int_amdgcn_buffer_wbinvl1_vol : // VI Intrinsics //===----------------------------------------------------------------------===// +// llvm.amdgcn.mov.dpp.i32 <src> <dpp_ctrl> <bound_ctrl> <bank_mask> <row_mask> +def int_amdgcn_mov_dpp : + Intrinsic<[llvm_anyint_ty], + [LLVMMatchType<0>, llvm_i32_ty, llvm_i1_ty, llvm_i32_ty, + llvm_i32_ty], [IntrNoMem, IntrConvergent]>; + def int_amdgcn_s_dcache_wb : GCCBuiltin<"__builtin_amdgcn_s_dcache_wb">, Intrinsic<[], [], []>; diff --git a/llvm/lib/Target/AMDGPU/VIInstructions.td b/llvm/lib/Target/AMDGPU/VIInstructions.td index 1a7801c92bd..89f0a14ff84 100644 --- a/llvm/lib/Target/AMDGPU/VIInstructions.td +++ b/llvm/lib/Target/AMDGPU/VIInstructions.td @@ -109,4 +109,15 @@ def : Pat < (S_BUFFER_LOAD_DWORD_IMM $sbase, (as_i32imm $offset)) >; +//===----------------------------------------------------------------------===// +// DPP Paterns +//===----------------------------------------------------------------------===// + +def : Pat < + (int_amdgcn_mov_dpp i32:$src, imm:$dpp_ctrl, imm:$bound_ctrl, + imm:$bank_mask, imm:$row_mask), + (V_MOV_B32_dpp $src, (as_i32imm $dpp_ctrl), (as_i1imm $bound_ctrl), + (as_i32imm $bank_mask), (as_i32imm $row_mask)) +>; + } // End Predicates = [isVI] diff --git a/llvm/test/CodeGen/AMDGPU/llvm.amdgcn.mov.dpp.ll b/llvm/test/CodeGen/AMDGPU/llvm.amdgcn.mov.dpp.ll new file mode 100644 index 00000000000..72ade215aa7 --- /dev/null +++ b/llvm/test/CodeGen/AMDGPU/llvm.amdgcn.mov.dpp.ll @@ -0,0 +1,13 @@ +; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs -show-mc-encoding < %s | FileCheck -check-prefix=VI %s + +; VI-LABEL: {{^}}dpp_test: +; VI: v_mov_b32 v0, v0, 1, -1, 1, 1 ; encoding: [0xfa,0x02,0x00,0x7e,0x00,0x01,0x08,0x11] +define void @dpp_test(i32 addrspace(1)* %out, i32 %in) { + %tmp0 = call i32 @llvm.amdgcn.mov.dpp.i32(i32 %in, i32 1, i1 1, i32 1, i32 1) #0 + store i32 %tmp0, i32 addrspace(1)* %out + ret void +} + +declare i32 @llvm.amdgcn.mov.dpp.i32(i32, i32, i1, i32, i32) #0 + +attributes #0 = { nounwind readnone convergent } |