AMDGPU/SI: Add llvm.amdgcn.mov.dpp intrinsic

This intrinsic will be used to expose dpp functionality to higher-level languages. It will map to the dpp version of v_mov_b32. llvm-svn: 260792
author: Tom Stellard <thomas.stellard@amd.com> 2016-02-13 02:09:49 +0000
committer: Tom Stellard <thomas.stellard@amd.com> 2016-02-13 02:09:49 +0000
commit: 4409051d00a6b053354c93e28880c24aa00d598c (patch)
tree: ac8e4f0a30ac241a1fc8e30c687c974bcc77a401
parent: 7c7c3e35911f7f7c1709cac05b1d27ce19db5ab5 (diff)
download: bcm5719-llvm-4409051d00a6b053354c93e28880c24aa00d598c.tar.gz
bcm5719-llvm-4409051d00a6b053354c93e28880c24aa00d598c.zip
3 files changed, 30 insertions, 0 deletions
diff --git a/llvm/include/llvm/IR/IntrinsicsAMDGPU.td b/llvm/include/llvm/IR/IntrinsicsAMDGPU.td
index d2e76b449e0..ef3c24080b8 100644
--- a/llvm/include/llvm/IR/IntrinsicsAMDGPU.td
+++ b/llvm/include/llvm/IR/IntrinsicsAMDGPU.td
@@ -203,6 +203,12 @@ def int_amdgcn_buffer_wbinvl1_vol :
 // VI Intrinsics
 //===----------------------------------------------------------------------===//
 
+// llvm.amdgcn.mov.dpp.i32 <src> <dpp_ctrl> <bound_ctrl> <bank_mask> <row_mask>
+def int_amdgcn_mov_dpp :
+  Intrinsic<[llvm_anyint_ty],
+            [LLVMMatchType<0>, llvm_i32_ty, llvm_i1_ty, llvm_i32_ty,
+             llvm_i32_ty], [IntrNoMem, IntrConvergent]>;
+
 def int_amdgcn_s_dcache_wb :
   GCCBuiltin<"__builtin_amdgcn_s_dcache_wb">,
   Intrinsic<[], [], []>;
diff --git a/llvm/lib/Target/AMDGPU/VIInstructions.td b/llvm/lib/Target/AMDGPU/VIInstructions.td
index 1a7801c92bd..89f0a14ff84 100644
--- a/llvm/lib/Target/AMDGPU/VIInstructions.td
+++ b/llvm/lib/Target/AMDGPU/VIInstructions.td
@@ -109,4 +109,15 @@ def : Pat <
   (S_BUFFER_LOAD_DWORD_IMM $sbase, (as_i32imm $offset))
 >;
 
+//===----------------------------------------------------------------------===//
+// DPP Paterns
+//===----------------------------------------------------------------------===//
+
+def : Pat <
+  (int_amdgcn_mov_dpp i32:$src, imm:$dpp_ctrl, imm:$bound_ctrl,
+                      imm:$bank_mask, imm:$row_mask),
+  (V_MOV_B32_dpp $src, (as_i32imm $dpp_ctrl), (as_i1imm $bound_ctrl),
+                       (as_i32imm $bank_mask), (as_i32imm $row_mask))
+>;
+
 } // End Predicates = [isVI]
diff --git a/llvm/test/CodeGen/AMDGPU/llvm.amdgcn.mov.dpp.ll b/llvm/test/CodeGen/AMDGPU/llvm.amdgcn.mov.dpp.ll
new file mode 100644
index 00000000000..72ade215aa7
--- /dev/null
+++ b/llvm/test/CodeGen/AMDGPU/llvm.amdgcn.mov.dpp.ll
@@ -0,0 +1,13 @@
+; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs -show-mc-encoding < %s | FileCheck -check-prefix=VI %s
+
+; VI-LABEL: {{^}}dpp_test:
+; VI: v_mov_b32 v0, v0, 1, -1, 1, 1 ; encoding: [0xfa,0x02,0x00,0x7e,0x00,0x01,0x08,0x11]
+define void @dpp_test(i32 addrspace(1)* %out, i32 %in) {
+  %tmp0 = call i32 @llvm.amdgcn.mov.dpp.i32(i32 %in, i32 1, i1 1, i32 1, i32 1) #0
+  store i32 %tmp0, i32 addrspace(1)* %out
+  ret void
+}
+
+declare i32 @llvm.amdgcn.mov.dpp.i32(i32, i32, i1, i32, i32) #0
+
+attributes #0 = { nounwind readnone convergent }
author	Tom Stellard <thomas.stellard@amd.com>	2016-02-13 02:09:49 +0000
committer	Tom Stellard <thomas.stellard@amd.com>	2016-02-13 02:09:49 +0000
commit	4409051d00a6b053354c93e28880c24aa00d598c (patch)
tree	ac8e4f0a30ac241a1fc8e30c687c974bcc77a401
parent	7c7c3e35911f7f7c1709cac05b1d27ce19db5ab5 (diff)
download	bcm5719-llvm-4409051d00a6b053354c93e28880c24aa00d598c.tar.gz bcm5719-llvm-4409051d00a6b053354c93e28880c24aa00d598c.zip