summary refs log tree commit diff stats
path: root/llvm/test/CodeGen/AMDGPU/llvm.round.ll
diff options
context:
space:
mode:
author Konstantin Zhuravlyov <kzhuravl_dev@outlook.com> 2017-04-13 23:17:00 +0000
committer Konstantin Zhuravlyov <kzhuravl_dev@outlook.com> 2017-04-13 23:17:00 +0000
commit d24aeb20fc3ac57a2180380edbeb3c0fa0cd03b2 (patch)
tree fb06f927219d033affee12be8f4da32198dd9289 /llvm/test/CodeGen/AMDGPU/llvm.round.ll
parent f93c58b81bfbe1e4502d8dd0465797fdd8fb400b (diff)
download bcm5719-llvm-d24aeb20fc3ac57a2180380edbeb3c0fa0cd03b2.tar.gz
bcm5719-llvm-d24aeb20fc3ac57a2180380edbeb3c0fa0cd03b2.zip
AMDGPU/GFX9: Do not use v_pack_b32_f16 when packing
Differential Revision: https://reviews.llvm.org/D31819 llvm-svn: 300275
Diffstat (limited to 'llvm/test/CodeGen/AMDGPU/llvm.round.ll')
-rw-r--r-- llvm/test/CodeGen/AMDGPU/llvm.round.ll 3
1 files changed, 2 insertions, 1 deletions
diff --git a/llvm/test/CodeGen/AMDGPU/llvm.round.ll b/llvm/test/CodeGen/AMDGPU/llvm.round.ll
index d211ad8ec9f..ffe87977870 100644
--- a/llvm/test/CodeGen/AMDGPU/llvm.round.ll
+++ b/llvm/test/CodeGen/AMDGPU/llvm.round.ll
@@ -87,7 +87,8 @@ define amdgpu_kernel void @round_f16(half addrspace(1)* %out, i32 %x.arg) #0 {
; GFX89: v_bfi_b32 [[COPYSIGN0:v[0-9]+]], [[K]], [[BFI_K]],
; GFX89: v_bfi_b32 [[COPYSIGN1:v[0-9]+]], [[K]], [[BFI_K]],
-; GFX9: v_pack_b32_f16
+; GFX9: v_and_b32_e32
+; GFX9: v_lshl_or_b32
define amdgpu_kernel void @round_v2f16(<2 x half> addrspace(1)* %out, i32 %in.arg) #0 {
%in = bitcast i32 %in.arg to <2 x half>
%result = call <2 x half> @llvm.round.v2f16(<2 x half> %in)
OpenPOWER on IntegriCloud