summaryrefslogtreecommitdiffstats
path: root/llvm/test/CodeGen/SystemZ/fp-abs-03.ll
diff options
context:
space:
mode:
authorUlrich Weigand <ulrich.weigand@de.ibm.com>2017-07-17 17:42:48 +0000
committerUlrich Weigand <ulrich.weigand@de.ibm.com>2017-07-17 17:42:48 +0000
commit33435c4c9c1dcecd109aef3d23d46ea43618d9ae (patch)
tree0e6a868ea02a04314fca2d6bc2a926c66aad666d /llvm/test/CodeGen/SystemZ/fp-abs-03.ll
parent2b3482fe8576f8e5de0d296baae5dfb290b9948a (diff)
downloadbcm5719-llvm-33435c4c9c1dcecd109aef3d23d46ea43618d9ae.tar.gz
bcm5719-llvm-33435c4c9c1dcecd109aef3d23d46ea43618d9ae.zip
[SystemZ] Add support for IBM z14 processor (2/3)
This adds support for the new 32-bit vector float instructions of z14. This includes: - Enabling the instructions for the assembler/disassembler. - CodeGen for the instructions, including new LLVM intrinsics. - Scheduler description support for the instructions. - Update to the vector cost function calculations. In general, CodeGen support for the new v4f32 instructions closely matches support for the existing v2f64 instructions. llvm-svn: 308195
Diffstat (limited to 'llvm/test/CodeGen/SystemZ/fp-abs-03.ll')
-rw-r--r--llvm/test/CodeGen/SystemZ/fp-abs-03.ll40
1 files changed, 40 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/SystemZ/fp-abs-03.ll b/llvm/test/CodeGen/SystemZ/fp-abs-03.ll
new file mode 100644
index 00000000000..ccb69642a2c
--- /dev/null
+++ b/llvm/test/CodeGen/SystemZ/fp-abs-03.ll
@@ -0,0 +1,40 @@
+; Test floating-point absolute on z14.
+;
+; RUN: llc < %s -mtriple=s390x-linux-gnu -mcpu=z14 | FileCheck %s
+
+; Test f32.
+declare float @llvm.fabs.f32(float %f)
+define float @f1(float %f) {
+; CHECK-LABEL: f1:
+; CHECK: lpdfr %f0, %f0
+; CHECK: br %r14
+ %res = call float @llvm.fabs.f32(float %f)
+ ret float %res
+}
+
+; Test f64.
+declare double @llvm.fabs.f64(double %f)
+define double @f2(double %f) {
+; CHECK-LABEL: f2:
+; CHECK: lpdfr %f0, %f0
+; CHECK: br %r14
+ %res = call double @llvm.fabs.f64(double %f)
+ ret double %res
+}
+
+; Test f128. With the loads and stores, a pure absolute would probably
+; be better implemented using an NI on the upper byte. Do some extra
+; processing so that using FPRs is unequivocally better.
+declare fp128 @llvm.fabs.f128(fp128 %f)
+define void @f3(fp128 *%ptr, fp128 *%ptr2) {
+; CHECK-LABEL: f3:
+; CHECK: lpxbr
+; CHECK: dxbr
+; CHECK: br %r14
+ %orig = load fp128 , fp128 *%ptr
+ %abs = call fp128 @llvm.fabs.f128(fp128 %orig)
+ %op2 = load fp128 , fp128 *%ptr2
+ %res = fdiv fp128 %abs, %op2
+ store fp128 %res, fp128 *%ptr
+ ret void
+}
OpenPOWER on IntegriCloud