diff options
Diffstat (limited to 'llvm/test/Transforms/LoopVectorize')
-rw-r--r-- | llvm/test/Transforms/LoopVectorize/pr30806-phi-scev.ll | 66 | ||||
-rw-r--r-- | llvm/test/Transforms/LoopVectorize/pr30806.ll | 65 |
2 files changed, 131 insertions, 0 deletions
diff --git a/llvm/test/Transforms/LoopVectorize/pr30806-phi-scev.ll b/llvm/test/Transforms/LoopVectorize/pr30806-phi-scev.ll new file mode 100644 index 00000000000..e04bdd6607d --- /dev/null +++ b/llvm/test/Transforms/LoopVectorize/pr30806-phi-scev.ll @@ -0,0 +1,66 @@ +; RUN: opt -S -indvars < %s | FileCheck %s + +; Produced from the test-case: +; +; extern void foo(char *, unsigned , unsigned *); +; extern void bar(int *, long); +; extern char *processBuf(char *); +; +; extern unsigned theSize; +; +; void foo(char *buf, unsigned denominator, unsigned *flag) { +; int incr = (int) (theSize / denominator); +; int inx = 0; +; while (*flag) { +; int itmp = inx + incr; +; int i = (int) theSize; +; bar(&i, (long) itmp); +; buf = processBuf(buf); +; inx = itmp; +; } +; } + +target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128" + +@theSize = external local_unnamed_addr global i32, align 4 + +define void @foo(i8* %buf, i32 %denominator, i32* %flag) local_unnamed_addr { +entry: + %i = alloca i32, align 4 + %0 = load i32, i32* @theSize, align 4 + %div = udiv i32 %0, %denominator + %1 = load i32, i32* %flag, align 4 + %tobool5 = icmp eq i32 %1, 0 + br i1 %tobool5, label %while.end, label %while.body.lr.ph + +while.body.lr.ph: ; preds = %entry + %2 = bitcast i32* %i to i8* + br label %while.body + +while.body: ; preds = %while.body.lr.ph, %while.body +; Check that there are two PHIs followed by a 'sext' in the same block, and that +; the test does not crash. +; CHECK: phi +; CHECK-NEXT: phi +; CHECK-NEXT: sext + %buf.addr.07 = phi i8* [ %buf, %while.body.lr.ph ], [ %call, %while.body ] + %inx.06 = phi i32 [ 0, %while.body.lr.ph ], [ %add, %while.body ] + %add = add nsw i32 %inx.06, %div + %3 = load i32, i32* @theSize, align 4 + store i32 %3, i32* %i, align 4 + %conv = sext i32 %add to i64 + call void @bar(i32* nonnull %i, i64 %conv) + %call = call i8* @processBuf(i8* %buf.addr.07) + %4 = load i32, i32* %flag, align 4 + %tobool = icmp eq i32 %4, 0 + br i1 %tobool, label %while.end.loopexit, label %while.body + +while.end.loopexit: ; preds = %while.body + br label %while.end + +while.end: ; preds = %while.end.loopexit, %entry + ret void +} + +declare void @bar(i32*, i64) local_unnamed_addr +declare i8* @processBuf(i8*) local_unnamed_addr diff --git a/llvm/test/Transforms/LoopVectorize/pr30806.ll b/llvm/test/Transforms/LoopVectorize/pr30806.ll new file mode 100644 index 00000000000..dd9f6629413 --- /dev/null +++ b/llvm/test/Transforms/LoopVectorize/pr30806.ll @@ -0,0 +1,65 @@ +; RUN: opt -loop-vectorize -S < %s 2>&1 | FileCheck %s + +; Produced from test-case: +; +; void testGuardedInnerLoop(uint32_t *ptr, uint32_t denom, uint32_t numer, uint32_t outer_lim) +; { +; for(uint32_t outer_i = 0; outer_i < outer_lim; ++outer_i) { +; if (denom > 0) { +; const uint32_t lim = numer / denom; +; +; for (uint32_t i = 0; i < lim; ++i) +; ptr[i] = 1; +; } +; } +; } + + +target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128-ni:1" +target triple = "x86_64-unknown-linux-gnu" + +define void @testGuardedInnerLoop(i32* %ptr, i32 %denom, i32 %numer, i32 %outer_lim) { +entry: + %cmp1 = icmp eq i32 %outer_lim, 0 + br i1 %cmp1, label %exit, label %loop1.preheader + +; Verify that a 'udiv' does not appear between the 'loop1.preheader' label, and +; whatever label comes next. +loop1.preheader: +; CHECK-LABEL: loop1.preheader: +; CHECK-NOT: udiv +; CHECK-LABEL: : + br label %loop1 + +loop1: + %outer_i = phi i32 [ %inc1, %loop2.exit ], [ 0, %loop1.preheader ] + %0 = add i32 %denom, -1 + %1 = icmp ult i32 %0, %numer + br i1 %1, label %loop2.preheader, label %loop2.exit + +; Verify that a 'udiv' does appear between the 'loop2.preheader' label, and +; whatever label comes next. +loop2.preheader: +; CHECK-LABEL: loop2.preheader: +; CHECK: udiv +; CHECK-LABEL: : + %lim = udiv i32 %numer, %denom + %2 = zext i32 %lim to i64 + br label %loop2 + +loop2: + %indvar.loop2 = phi i64 [ 0, %loop2.preheader ], [ %indvar.loop2.next, %loop2 ] + %arrayidx = getelementptr inbounds i32, i32* %ptr, i64 %indvar.loop2 + store i32 1, i32* %arrayidx, align 4 + %indvar.loop2.next = add nuw nsw i64 %indvar.loop2, 1 + %cmp2 = icmp ult i64 %indvar.loop2.next, %2 + br i1 %cmp2, label %loop2, label %loop2.exit + +loop2.exit: + %inc1 = add nuw i32 %outer_i, 1 + %exitcond = icmp eq i32 %inc1, %outer_lim + br i1 %exitcond, label %exit, label %loop1 + +exit: + ret void +} |