Add some missing isel predicates on def : pat patterns to avoid generating VFP vmla / vmls (they cause stalls). Disabling them in isel is probably not the right solution; I'll look into a proper solution next.

llvm-svn: 118922
author: Evan Cheng <evan.cheng@apple.com> 2010-11-12 20:32:20 +0000
committer: Evan Cheng <evan.cheng@apple.com> 2010-11-12 20:32:20 +0000
commit: 2d59ee34f11f63067c8ba6c1f894dfc6eddd802c (patch)
tree: 1edbfdd7fb4f2fddde96afc1cfd9fc18e77f5e23 /llvm/test/CodeGen/ARM/fnmscs.ll
parent: 6bb1ae9d45e1cff18273092ab320ea9dd51ee83e (diff)
download: bcm5719-llvm-2d59ee34f11f63067c8ba6c1f894dfc6eddd802c.tar.gz
bcm5719-llvm-2d59ee34f11f63067c8ba6c1f894dfc6eddd802c.zip
1 files changed, 56 insertions, 8 deletions
diff --git a/llvm/test/CodeGen/ARM/fnmscs.ll b/llvm/test/CodeGen/ARM/fnmscs.ll
index 0b47edd5f1f..5d832537c0f 100644
--- a/llvm/test/CodeGen/ARM/fnmscs.ll
+++ b/llvm/test/CodeGen/ARM/fnmscs.ll
@@ -1,23 +1,71 @@
-; RUN: llc < %s -march=arm -mattr=+vfp2 | FileCheck %s
-; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s
-; RUN: llc < %s -march=arm -mcpu=cortex-a8 | FileCheck %s
-; RUN: llc < %s -march=arm -mcpu=cortex-a9 | FileCheck %s
+; RUN: llc < %s -march=arm -mattr=+vfp2 | FileCheck %s -check-prefix=VFP2
+; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s -check-prefix=NEON
+; RUN: llc < %s -march=arm -mcpu=cortex-a8 | FileCheck %s -check-prefix=A8
 
-define float @test1(float %acc, float %a, float %b) nounwind {
-; CHECK: vnmla.f32 s{{.*}}, s{{.*}}, s{{.*}}
+define float @t1(float %acc, float %a, float %b) nounwind {
 entry:
+; VFP2: t1:
+; VFP2: vnmla.f32
+
+; NEON: t1:
+; NEON: vnmla.f32
+
+; A8: t1:
+; A8: vnmul.f32 s0, s1, s0
+; A8: vsub.f32 d0, d0, d1
 	%0 = fmul float %a, %b
 	%1 = fsub float -0.0, %0
         %2 = fsub float %1, %acc
 	ret float %2
 }
 
-define float @test2(float %acc, float %a, float %b) nounwind {
-; CHECK: vnmla.f32 s{{.*}}, s{{.*}}, s{{.*}}
+define float @t2(float %acc, float %a, float %b) nounwind {
 entry:
+; VFP2: t2:
+; VFP2: vnmla.f32
+
+; NEON: t2:
+; NEON: vnmla.f32
+
+; A8: t2:
+; A8: vnmul.f32 s0, s1, s0
+; A8: vsub.f32 d0, d0, d1
 	%0 = fmul float %a, %b
 	%1 = fmul float -1.0, %0
         %2 = fsub float %1, %acc
 	ret float %2
 }
 
+define double @t3(double %acc, double %a, double %b) nounwind {
+entry:
+; VFP2: t3:
+; VFP2: vnmla.f64
+
+; NEON: t3:
+; NEON: vnmla.f64
+
+; A8: t3:
+; A8: vnmul.f64 d16, d16, d17
+; A8: vsub.f64 d16, d16, d17
+	%0 = fmul double %a, %b
+	%1 = fsub double -0.0, %0
+        %2 = fsub double %1, %acc
+	ret double %2
+}
+
+define double @t4(double %acc, double %a, double %b) nounwind {
+entry:
+; VFP2: t4:
+; VFP2: vnmla.f64
+
+; NEON: t4:
+; NEON: vnmla.f64
+
+; A8: t4:
+; A8: vnmul.f64 d16, d16, d17
+; A8: vsub.f64 d16, d16, d17
+	%0 = fmul double %a, %b
+	%1 = fmul double -1.0, %0
+        %2 = fsub double %1, %acc
+	ret double %2
+}
author	Evan Cheng <evan.cheng@apple.com>	2010-11-12 20:32:20 +0000
committer	Evan Cheng <evan.cheng@apple.com>	2010-11-12 20:32:20 +0000
commit	2d59ee34f11f63067c8ba6c1f894dfc6eddd802c (patch)
tree	1edbfdd7fb4f2fddde96afc1cfd9fc18e77f5e23 /llvm/test/CodeGen/ARM/fnmscs.ll
parent	6bb1ae9d45e1cff18273092ab320ea9dd51ee83e (diff)
download	bcm5719-llvm-2d59ee34f11f63067c8ba6c1f894dfc6eddd802c.tar.gz bcm5719-llvm-2d59ee34f11f63067c8ba6c1f894dfc6eddd802c.zip