summary | refs | log | tree | commit | diff | stats
path: root/llvm/test/CodeGen/R600/fmuladd.ll
diff options
context:
space:
mode:
author: Niels Ole Salscheider <niels_ole@salscheider-online.de> 2013-08-10 10:38:54 +0000
committer: Niels Ole Salscheider <niels_ole@salscheider-online.de> 2013-08-10 10:38:54 +0000
commit: d3a039fed2c36d735ae4bbd43e0934d0303226af (patch)
tree: 0f97daafb0cbeef80ea57be7a7ee2412115ce726 /llvm/test/CodeGen/R600/fmuladd.ll
parent: 6509ac65a9c0177b27c5eb9d6aee0455a1f29c06 (diff)
download: bcm5719-llvm-d3a039fed2c36d735ae4bbd43e0934d0303226af.tar.gz
download: bcm5719-llvm-d3a039fed2c36d735ae4bbd43e0934d0303226af.zip
R600/SI: FMA is faster than fmul and fadd for f64
llvm-svn: 188136
Diffstat (limited to 'llvm/test/CodeGen/R600/fmuladd.ll')
-rw-r--r-- llvm/test/CodeGen/R600/fmuladd.ll | 31
1 files changed, 31 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/R600/fmuladd.ll b/llvm/test/CodeGen/R600/fmuladd.ll
new file mode 100644
index 00000000000..ac379f44aaa
--- /dev/null
+++ b/llvm/test/CodeGen/R600/fmuladd.ll
@@ -0,0 +1,31 @@
+; RUN: llc < %s -march=r600 -mcpu=SI | FileCheck %s
+
+; CHECK: @fmuladd_f32
+; CHECK: V_MAD_F32 {{VGPR[0-9]+, VGPR[0-9]+, VGPR[0-9]+, VGPR[0-9]+}}
+
+define void @fmuladd_f32(float addrspace(1)* %out, float addrspace(1)* %in1, ; f32 test case: the CHECK lines above this function expect a V_MAD_F32
+ float addrspace(1)* %in2, float addrspace(1)* %in3) {
+ %r0 = load float addrspace(1)* %in1 ; first multiplicand
+ %r1 = load float addrspace(1)* %in2 ; second multiplicand
+ %r2 = load float addrspace(1)* %in3 ; addend
+ %r3 = tail call float @llvm.fmuladd.f32(float %r0, float %r1, float %r2) ; %r0 * %r1 + %r2; the intrinsic lets the backend choose fused or unfused
+ store float %r3, float addrspace(1)* %out ; write the result through %out
+ ret void
+}
+
+declare float @llvm.fmuladd.f32(float, float, float) ; intrinsic called by @fmuladd_f32
+
+; CHECK: @fmuladd_f64
+; CHECK: V_FMA_F64 {{VGPR[0-9]+_VGPR[0-9]+, VGPR[0-9]+_VGPR[0-9]+, VGPR[0-9]+_VGPR[0-9]+, VGPR[0-9]+_VGPR[0-9]+}}
+
+define void @fmuladd_f64(double addrspace(1)* %out, double addrspace(1)* %in1, ; f64 test case: the CHECK lines above this function expect a V_FMA_F64 on register pairs
+ double addrspace(1)* %in2, double addrspace(1)* %in3) {
+ %r0 = load double addrspace(1)* %in1 ; first multiplicand
+ %r1 = load double addrspace(1)* %in2 ; second multiplicand
+ %r2 = load double addrspace(1)* %in3 ; addend
+ %r3 = tail call double @llvm.fmuladd.f64(double %r0, double %r1, double %r2) ; %r0 * %r1 + %r2; the intrinsic lets the backend choose fused or unfused
+ store double %r3, double addrspace(1)* %out ; write the result through %out
+ ret void
+}
+
+declare double @llvm.fmuladd.f64(double, double, double) ; intrinsic called by @fmuladd_f64
OpenPOWER on IntegriCloud