diff options
author | Lawrence Hu <lawrence@codeaurora.org> | 2016-04-30 00:51:22 +0000 |
---|---|---|
committer | Lawrence Hu <lawrence@codeaurora.org> | 2016-04-30 00:51:22 +0000 |
commit | 1befea2bdcb2514298441fd15adf89e65548faeb (patch) | |
tree | 79eac202eba2db4e9da16b4648d4fbaef9aa3454 /llvm/test | |
parent | df29078dc84e22ff99dc11dfe2c926a4098d4d81 (diff) | |
download | bcm5719-llvm-1befea2bdcb2514298441fd15adf89e65548faeb.tar.gz bcm5719-llvm-1befea2bdcb2514298441fd15adf89e65548faeb.zip |
Reroll loops with multiple IV and negative step part 3
support multiple induction variables
This patch enable loop reroll for the following case:
for(int i=0; i<N; i += 2) {
S += *a++;
S += *a++;
};
Differential Revision: http://reviews.llvm.org/D16550
llvm-svn: 268147
Diffstat (limited to 'llvm/test')
-rw-r--r-- | llvm/test/Transforms/LoopReroll/complex_reroll.ll | 134 |
1 files changed, 134 insertions, 0 deletions
diff --git a/llvm/test/Transforms/LoopReroll/complex_reroll.ll b/llvm/test/Transforms/LoopReroll/complex_reroll.ll new file mode 100644 index 00000000000..3a2c7221578 --- /dev/null +++ b/llvm/test/Transforms/LoopReroll/complex_reroll.ll @@ -0,0 +1,134 @@ +; RUN: opt -S -loop-reroll %s | FileCheck %s +declare i32 @goo(i32, i32) + +@buf = external global i8* +@aaa = global [16 x i8] c"\01\02\03\04\05\06\07\08\09\0A\0B\0C\0D\0E\0F\10", align 1 + +define i32 @test1(i32 %len) { +entry: + br label %while.body + +while.body: +;CHECK-LABEL: while.body: +;CHECK-NEXT: %indvar = phi i32 [ %indvar.next, %while.body ], [ 0, %entry ] +;CHECK-NEXT: %buf.021 = phi i8* [ getelementptr inbounds ([16 x i8], [16 x i8]* @aaa, i64 0, i64 0), %entry ], [ %add.ptr, %while.body ] +;CHECK-NEXT: %sum44.020 = phi i64 [ 0, %entry ], [ %add, %while.body ] +;CHECK-NEXT: [[T2:%[0-9]+]] = load i8, i8* %buf.021, align 1 +;CHECK-NEXT: %conv = zext i8 [[T2]] to i64 +;CHECK-NEXT: %add = add i64 %conv, %sum44.020 +;CHECK-NEXT: %add.ptr = getelementptr inbounds i8, i8* %buf.021, i64 1 +;CHECK-NEXT: %indvar.next = add i32 %indvar, 1 +;CHECK-NEXT: %exitcond = icmp eq i32 %indvar, 1 +;CHECK-NEXT: br i1 %exitcond, label %while.end, label %while.body + + %dec22 = phi i32 [ 4, %entry ], [ %dec, %while.body ] + %buf.021 = phi i8* [ getelementptr inbounds ([16 x i8], [16 x i8]* @aaa, i64 0, i64 0), %entry ], [ %add.ptr, %while.body ] + %sum44.020 = phi i64 [ 0, %entry ], [ %add9, %while.body ] + %0 = load i8, i8* %buf.021, align 1 + %conv = zext i8 %0 to i64 + %add = add i64 %conv, %sum44.020 + %arrayidx1 = getelementptr inbounds i8, i8* %buf.021, i64 1 + %1 = load i8, i8* %arrayidx1, align 1 + %conv2 = zext i8 %1 to i64 + %add3 = add i64 %add, %conv2 + %arrayidx4 = getelementptr inbounds i8, i8* %buf.021, i64 2 + %2 = load i8, i8* %arrayidx4, align 1 + %conv5 = zext i8 %2 to i64 + %add6 = add i64 %add3, %conv5 + %arrayidx7 = getelementptr inbounds i8, i8* %buf.021, i64 3 + %3 = load i8, i8* %arrayidx7, align 1 + %conv8 = zext i8 %3 to i64 + %add9 = add i64 %add6, %conv8 + %add.ptr = getelementptr inbounds i8, i8* %buf.021, i64 4 + %dec = add nsw i32 %dec22, -1 + %tobool = icmp eq i32 %dec, 0 + br i1 %tobool, label %while.end, label %while.body + +while.end: ; preds = %while.body + %conv11 = trunc i64 %add9 to i32 + %call = tail call i32 @goo(i32 0, i32 %conv11) + unreachable +} + +define i32 @test2(i32 %N, i32* nocapture readonly %a, i32 %S) { +entry: + %cmp.9 = icmp sgt i32 %N, 0 + br i1 %cmp.9, label %for.body.lr.ph, label %for.cond.cleanup + +for.body.lr.ph: + br label %for.body + +for.cond.for.cond.cleanup_crit_edge: + br label %for.cond.cleanup + +for.cond.cleanup: + %S.addr.0.lcssa = phi i32 [ %add2, %for.cond.for.cond.cleanup_crit_edge ], [ %S, %entry ] + ret i32 %S.addr.0.lcssa + +for.body: +;CHECK-LABEL: for.body: +;CHECK-NEXT: %indvar = phi i32 [ %indvar.next, %for.body ], [ 0, %for.body.lr.ph ] +;CHECK-NEXT: %S.addr.011 = phi i32 [ %S, %for.body.lr.ph ], [ %add, %for.body ] +;CHECK-NEXT: %a.addr.010 = phi i32* [ %a, %for.body.lr.ph ], [ %incdec.ptr1, %for.body ] +;CHECK-NEXT: %4 = load i32, i32* %a.addr.010, align 4 +;CHECK-NEXT: %add = add nsw i32 %4, %S.addr.011 +;CHECK-NEXT: %incdec.ptr1 = getelementptr inbounds i32, i32* %a.addr.010, i64 1 +;CHECK-NEXT: %indvar.next = add i32 %indvar, 1 +;CHECK-NEXT: %exitcond = icmp eq i32 %indvar, %3 +;CHECK-NEXT: br i1 %exitcond, label %for.cond.for.cond.cleanup_crit_edge, label %for.body + + %i.012 = phi i32 [ 0, %for.body.lr.ph ], [ %add3, %for.body ] + %S.addr.011 = phi i32 [ %S, %for.body.lr.ph ], [ %add2, %for.body ] + %a.addr.010 = phi i32* [ %a, %for.body.lr.ph ], [ %incdec.ptr1, %for.body ] + %incdec.ptr = getelementptr inbounds i32, i32* %a.addr.010, i64 1 + %0 = load i32, i32* %a.addr.010, align 4 + %add = add nsw i32 %0, %S.addr.011 + %incdec.ptr1 = getelementptr inbounds i32, i32* %a.addr.010, i64 2 + %1 = load i32, i32* %incdec.ptr, align 4 + %add2 = add nsw i32 %add, %1 + %add3 = add nsw i32 %i.012, 2 + %cmp = icmp slt i32 %add3, %N + br i1 %cmp, label %for.body, label %for.cond.for.cond.cleanup_crit_edge +} + +define i32 @test3(i32* nocapture readonly %buf, i32 %len) #0 { +entry: + %cmp10 = icmp sgt i32 %len, 1 + br i1 %cmp10, label %while.body.preheader, label %while.end + +while.body.preheader: ; preds = %entry + br label %while.body + +while.body: ; preds = %while.body.preheader, %while.body +;CHECK-LABEL: while.body: +;CHECK-NEXT: %indvar = phi i32 [ %indvar.next, %while.body ], [ 0, %while.body.preheader ] +;CHECK-NEXT: %S.012 = phi i32 [ %add, %while.body ], [ undef, %while.body.preheader ] +;CHECK-NEXT: %buf.addr.011 = phi i32* [ %add.ptr, %while.body ], [ %buf, %while.body.preheader ] +;CHECK-NEXT: %4 = load i32, i32* %buf.addr.011, align 4 +;CHECK-NEXT: %add = add nsw i32 %4, %S.012 +;CHECK-NEXT: %add.ptr = getelementptr inbounds i32, i32* %buf.addr.011, i64 -1 +;CHECK-NEXT: %indvar.next = add i32 %indvar, 1 +;CHECK-NEXT: %exitcond = icmp eq i32 %indvar, %3 +;CHECK-NEXT: br i1 %exitcond, label %while.end.loopexit, label %while.body + + %i.013 = phi i32 [ %sub, %while.body ], [ %len, %while.body.preheader ] + %S.012 = phi i32 [ %add2, %while.body ], [ undef, %while.body.preheader ] + %buf.addr.011 = phi i32* [ %add.ptr, %while.body ], [ %buf, %while.body.preheader ] + %0 = load i32, i32* %buf.addr.011, align 4 + %add = add nsw i32 %0, %S.012 + %arrayidx1 = getelementptr inbounds i32, i32* %buf.addr.011, i64 -1 + %1 = load i32, i32* %arrayidx1, align 4 + %add2 = add nsw i32 %add, %1 + %add.ptr = getelementptr inbounds i32, i32* %buf.addr.011, i64 -2 + %sub = add nsw i32 %i.013, -2 + %cmp = icmp sgt i32 %sub, 1 + br i1 %cmp, label %while.body, label %while.end.loopexit + +while.end.loopexit: ; preds = %while.body + br label %while.end + +while.end: ; preds = %while.end.loopexit, %entry + %S.0.lcssa = phi i32 [ undef, %entry ], [ %add2, %while.end.loopexit ] + ret i32 %S.0.lcssa +} + |