diff options
Diffstat (limited to 'llvm/test/CodeGen/AMDGPU/llvm.rint.ll')
-rw-r--r-- | llvm/test/CodeGen/AMDGPU/llvm.rint.ll | 62 |
1 files changed, 62 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/AMDGPU/llvm.rint.ll b/llvm/test/CodeGen/AMDGPU/llvm.rint.ll new file mode 100644 index 00000000000..661db51ad03 --- /dev/null +++ b/llvm/test/CodeGen/AMDGPU/llvm.rint.ll @@ -0,0 +1,62 @@ +; RUN: llc -march=r600 -mcpu=redwood < %s | FileCheck %s -check-prefix=R600 -check-prefix=FUNC +; RUN: llc -march=amdgcn -mcpu=SI -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s +; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s + +; FUNC-LABEL: {{^}}rint_f32: +; R600: RNDNE + +; SI: v_rndne_f32_e32 +define void @rint_f32(float addrspace(1)* %out, float %in) { +entry: + %0 = call float @llvm.rint.f32(float %in) #0 + store float %0, float addrspace(1)* %out + ret void +} + +; FUNC-LABEL: {{^}}rint_v2f32: +; R600: RNDNE +; R600: RNDNE + +; SI: v_rndne_f32_e32 +; SI: v_rndne_f32_e32 +define void @rint_v2f32(<2 x float> addrspace(1)* %out, <2 x float> %in) { +entry: + %0 = call <2 x float> @llvm.rint.v2f32(<2 x float> %in) #0 + store <2 x float> %0, <2 x float> addrspace(1)* %out + ret void +} + +; FUNC-LABEL: {{^}}rint_v4f32: +; R600: RNDNE +; R600: RNDNE +; R600: RNDNE +; R600: RNDNE + +; SI: v_rndne_f32_e32 +; SI: v_rndne_f32_e32 +; SI: v_rndne_f32_e32 +; SI: v_rndne_f32_e32 +define void @rint_v4f32(<4 x float> addrspace(1)* %out, <4 x float> %in) { +entry: + %0 = call <4 x float> @llvm.rint.v4f32(<4 x float> %in) #0 + store <4 x float> %0, <4 x float> addrspace(1)* %out + ret void +} + +; FUNC-LABEL: {{^}}legacy_amdil_round_nearest_f32: +; R600: RNDNE + +; SI: v_rndne_f32_e32 +define void @legacy_amdil_round_nearest_f32(float addrspace(1)* %out, float %in) { +entry: + %0 = call float @llvm.AMDIL.round.nearest.f32(float %in) #0 + store float %0, float addrspace(1)* %out + ret void +} + +declare float @llvm.AMDIL.round.nearest.f32(float) #0 +declare float @llvm.rint.f32(float) #0 +declare <2 x float> @llvm.rint.v2f32(<2 x float>) #0 +declare <4 x float> @llvm.rint.v4f32(<4 x float>) #0 + +attributes #0 = { nounwind readnone } |