summaryrefslogtreecommitdiffstats
path: root/llvm/test
diff options
context:
space:
mode:
authorDiego Caballero <diego.caballero@intel.com>2018-06-15 16:21:35 +0000
committerDiego Caballero <diego.caballero@intel.com>2018-06-15 16:21:35 +0000
commit68795245cfb3ca1d3c6ddb7e87ed8165de20dbef (patch)
treef38d08087348c1c1db404c66afee7183a797398c /llvm/test
parent6927cf0c2ae41e607883c453ce81f82bb922ff48 (diff)
downloadbcm5719-llvm-68795245cfb3ca1d3c6ddb7e87ed8165de20dbef.tar.gz
bcm5719-llvm-68795245cfb3ca1d3c6ddb7e87ed8165de20dbef.zip
[LV] Prevent LV from running the cost model twice for VF=2
This is a minor fix for the LV cost model, where the cost for VF=2 was computed twice when vectorization of the loop was forced without specifying a VF. Reviewers: xusx595, hsaito, fhahn, mkuper. Reviewed By: hsaito, xusx595. Differential Revision: https://reviews.llvm.org/D48048. llvm-svn: 334840
Diffstat (limited to 'llvm/test')
-rw-r--r--llvm/test/Transforms/LoopVectorize/redundant-vf2-cost.ll34
1 files changed, 34 insertions, 0 deletions
diff --git a/llvm/test/Transforms/LoopVectorize/redundant-vf2-cost.ll b/llvm/test/Transforms/LoopVectorize/redundant-vf2-cost.ll
new file mode 100644
index 00000000000..bd69d27d2d5
--- /dev/null
+++ b/llvm/test/Transforms/LoopVectorize/redundant-vf2-cost.ll
@@ -0,0 +1,34 @@
+; RUN: opt < %s -loop-vectorize -mtriple x86_64 -debug -disable-output 2>&1 | FileCheck %s
+; REQUIRES: asserts
+
+; Check that the cost model is not executed twice for VF=2 when vectorization
+; is forced for a particular loop.
+
+; CHECK: LV: Found an estimated cost of {{[0-9]+}} for VF 2 For instruction: %{{[0-9]+}} = load i32
+; CHECK: LV: Found an estimated cost of {{[0-9]+}} for VF 2 For instruction: store i32
+; CHECK-NOT: LV: Found an estimated cost of {{[0-9]+}} for VF 2 For instruction: %{{[0-9]+}} = load i32
+; CHECK-NOT: LV: Found an estimated cost of {{[0-9]+}} for VF 2 For instruction: store i32
+; CHECK: LV: Vector loop of width 2 costs: {{[0-9]+}}.
+
+define i32 @foo(i32* %A, i32 %n) { ; increments A[0..n-1] in place; returns 0 if %n == 0, else the final loop counter
+entry:
+ %cmp3.i = icmp eq i32 %n, 0 ; guard: is the trip count zero?
+ br i1 %cmp3.i, label %exit, label %for.body.i ; skip the loop entirely when %n == 0
+
+for.body.i: ; single-block loop; this is the loop tagged with !llvm.loop !0
+ %iv = phi i32 [ %add.i, %for.body.i ], [ 0, %entry ] ; induction variable: 0 from entry, %add.i on the back edge
+ %ld_addr = getelementptr inbounds i32, i32* %A, i32 %iv ; address of A[iv]
+ %0 = load i32, i32* %ld_addr, align 4 ; left unnamed on purpose: the CHECK patterns match "%<number> = load i32"
+ %val = add i32 %0, 1 ; A[iv] + 1
+ store i32 %val, i32* %ld_addr, align 4 ; write back to the same element; the "store i32" the CHECK patterns match
+ %add.i = add nsw i32 %iv, 1 ; next induction value
+ %cmp.i = icmp eq i32 %add.i, %n ; loop ends once the incremented counter equals %n
+ br i1 %cmp.i, label %exit, label %for.body.i, !llvm.loop !0 ; back edge carries the loop metadata node !0
+
+exit:
+ %__init.addr.0.lcssa.i = phi i32 [ 0, %entry ], [ %add.i, %for.body.i ] ; 0 if the loop was skipped, otherwise the last %add.i
+ ret i32 %__init.addr.0.lcssa.i
+}
+
+!0 = !{!0, !1} ; loop ID node: refers to itself first, then lists its one property, !1
+!1 = !{!"llvm.loop.vectorize.enable", i1 true} ; requests vectorization of the loop; no vectorization width is given
OpenPOWER on IntegriCloud