diff options
| author | Jinsong Ji <jji@us.ibm.com> | 2018-11-20 14:55:43 +0000 |
|---|---|---|
| committer | Jinsong Ji <jji@us.ibm.com> | 2018-11-20 14:55:43 +0000 |
| commit | 42c13c22bc964f8dbb84d4e833b7558b89c9c87a (patch) | |
| tree | df737cf13031600bfbd2edc8e1c9fc8e6d77b6e5 | |
| parent | 56c74cff70c1a6ab640da900396418009caf67c1 (diff) | |
| download | bcm5719-llvm-42c13c22bc964f8dbb84d4e833b7558b89c9c87a.tar.gz bcm5719-llvm-42c13c22bc964f8dbb84d4e833b7558b89c9c87a.zip | |
[PowerPC][NFC]Add testcase for STWU scheduling check
This patch add a STWU testcase for scheduling check.
Currently P7/P8 which use itineraries are missing IIC_LdStStoreUpd,
We use CHECK-ITIN prefix to check P7/P8, then use default for P9 (and future).
We will fix the missing itineraries of IIC_LdStStoreUpd in following patch,
and update this testcase to show the scheduling difference only there.
Differential Revision: https://reviews.llvm.org/D54699
llvm-svn: 347310
| -rw-r--r-- | llvm/test/CodeGen/PowerPC/stwu-sched.ll | 72 |
1 files changed, 72 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/PowerPC/stwu-sched.ll b/llvm/test/CodeGen/PowerPC/stwu-sched.ll new file mode 100644 index 00000000000..f79956c9d76 --- /dev/null +++ b/llvm/test/CodeGen/PowerPC/stwu-sched.ll @@ -0,0 +1,72 @@ +; RUN: llc -mcpu=pwr9 -mtriple=powerpc64-unknown-linux-gnu < %s | FileCheck %s +; RUN: llc -mcpu=pwr9 -mtriple=powerpc64le-unknown-linux-gnu < %s | FileCheck %s +; RUN: llc -mcpu=pwr8 -mtriple=powerpc64-unknown-linux-gnu < %s | FileCheck %s \ +; RUN: --check-prefix=CHECK-ITIN +; RUN: llc -mcpu=pwr8 -mtriple=powerpc64le-unknown-linux-gnu < %s | FileCheck %s \ +; RUN: --check-prefix=CHECK-ITIN + + +%0 = type { i32, i32 } + +; Function Attrs: norecurse nounwind writeonly +define void @initCombList(%0* nocapture, i32 signext) local_unnamed_addr #0 { +; CHECK-LABEL: initCombList: +; CHECK: addi 3, 3, -8 +; CHECK-NEXT: stwu 5, 64(4) + +; CHECK-ITIN-LABEL: initCombList: +; CHECK-ITIN: addi 3, 3, -8 +; CHECK-ITIN-NEXT: stwu 5, 64(4) + + + %3 = zext i32 %1 to i64 + br i1 undef, label %6, label %4 + +; <label>:4: ; preds = %2 + store i32 0, i32* undef, align 4, !tbaa !1 + %5 = add nuw nsw i64 0, 1 + br label %6 + +; <label>:6: ; preds = %4, %2 + %7 = phi i64 [ 0, %2 ], [ %5, %4 ] + br i1 undef, label %23, label %8 + +; <label>:8: ; preds = %8, %6 + %9 = phi i64 [ %21, %8 ], [ %7, %6 ] + %10 = getelementptr inbounds %0, %0* %0, i64 %9, i32 1 + store i32 0, i32* %10, align 4, !tbaa !1 + %11 = add nuw nsw i64 %9, 1 + %12 = getelementptr inbounds %0, %0* %0, i64 %11, i32 1 + store i32 0, i32* %12, align 4, !tbaa !1 + %13 = add nsw i64 %9, 2 + %14 = getelementptr inbounds %0, %0* %0, i64 %13, i32 1 + store i32 0, i32* %14, align 4, !tbaa !1 + %15 = add nsw i64 %9, 3 + %16 = getelementptr inbounds %0, %0* %0, i64 %15, i32 1 + store i32 0, i32* %16, align 4, !tbaa !1 + %17 = add nsw i64 %9, 4 + %18 = getelementptr inbounds %0, %0* %0, i64 %17, i32 1 + store i32 0, i32* %18, align 4, !tbaa !1 + %19 = add nsw i64 %9, 6 + %20 = getelementptr inbounds %0, %0* %0, i64 %19, i32 1 + store i32 0, i32* %20, align 4, !tbaa !1 + %21 = add nsw i64 %9, 8 + %22 = icmp eq i64 %21, %3 + br i1 %22, label %23, label %8, !llvm.loop !6 + +; <label>:23: ; preds = %8, %6 + ret void +} + +attributes #0 = { norecurse nounwind writeonly "correctly-rounded-divide-sqrt-fp-math"="false" "disable-tail-calls"="false" "less-precise-fpmad"="false" "min-legal-vector-width"="0" "no-frame-pointer-elim"="false" "no-infs-fp-math"="false" "no-jump-tables"="false" "no-nans-fp-math"="false" "no-signed-zeros-fp-math"="false" "no-trapping-math"="false" "stack-protector-buffer-size"="8" "target-cpu"="ppc64le" "target-features"="+altivec,+bpermd,+crypto,+direct-move,+extdiv,+htm,+power8-vector,+vsx,-power9-vector,-qpx" "unsafe-fp-math"="false" "use-soft-float"="false" } + +!llvm.ident = !{!0} + +!0 = !{!"clang version 8.0.0 "} +!1 = !{!2, !3, i64 4} +!2 = !{!"", !3, i64 0, !3, i64 4} +!3 = !{!"int", !4, i64 0} +!4 = !{!"omnipotent char", !5, i64 0} +!5 = !{!"Simple C/C++ TBAA"} +!6 = distinct !{!6, !7} +!7 = !{!"llvm.loop.isvectorized", i32 1} |

