diff options
author | Renato Golin <renato.golin@linaro.org> | 2014-08-19 17:30:43 +0000 |
---|---|---|
committer | Renato Golin <renato.golin@linaro.org> | 2014-08-19 17:30:43 +0000 |
commit | dd6394d83344a3f61ddcf9fa0804308146d6b888 (patch) | |
tree | 1c3b1ca830bdf8fb64ee7c008bdc287d582c8069 /llvm/test/Transforms/LoopVectorize/duplicated-metadata.ll | |
parent | b25e7b42a977e0a31664ea0a34f4ffb9b37e5556 (diff) | |
download | bcm5719-llvm-dd6394d83344a3f61ddcf9fa0804308146d6b888.tar.gz bcm5719-llvm-dd6394d83344a3f61ddcf9fa0804308146d6b888.zip |
Small refactor on VectorizerHint for deduplication
Previously, the hint mechanism relied on clean up passes to remove redundant
metadata, which still showed up if running opt at low levels of optimization.
That also has shown that multiple nodes of the same type, but with different
values could still coexist, even if temporary, and cause confusion if the
next pass got the wrong value.
This patch makes sure that, if metadata already exists in a loop, the hint
mechanism will never append a new node, but always replace the existing one.
It also enhances the algorithm to cope with more metadata types in the future
by just adding a new type, not a lot of code.
llvm-svn: 215994
Diffstat (limited to 'llvm/test/Transforms/LoopVectorize/duplicated-metadata.ll')
-rw-r--r-- | llvm/test/Transforms/LoopVectorize/duplicated-metadata.ll | 30 |
1 files changed, 30 insertions, 0 deletions
diff --git a/llvm/test/Transforms/LoopVectorize/duplicated-metadata.ll b/llvm/test/Transforms/LoopVectorize/duplicated-metadata.ll new file mode 100644 index 00000000000..8353dca41cd --- /dev/null +++ b/llvm/test/Transforms/LoopVectorize/duplicated-metadata.ll @@ -0,0 +1,30 @@ +; RUN: opt < %s -loop-vectorize -S 2>&1 | FileCheck %s +target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128" +target triple = "x86_64-unknown-linux-gnu" + +; This test makes sure we don't duplicate the loop vectorizer's metadata +; while marking them as already vectorized (by setting width = 1), even +; at lower optimization levels, where no extra cleanup is done + +define void @_Z3fooPf(float* %a) { +entry: + br label %for.body + +for.body: ; preds = %for.body, %entry + %indvars.iv = phi i64 [ 0, %entry ], [ %indvars.iv.next, %for.body ] + %arrayidx = getelementptr inbounds float* %a, i64 %indvars.iv + %p = load float* %arrayidx, align 4 + %mul = fmul float %p, 2.000000e+00 + store float %mul, float* %arrayidx, align 4 + %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1 + %exitcond = icmp eq i64 %indvars.iv.next, 1024 + br i1 %exitcond, label %for.end, label %for.body, !llvm.loop !0 + +for.end: ; preds = %for.body + ret void +} + +!0 = metadata !{metadata !0, metadata !1} +!1 = metadata !{metadata !"llvm.loop.vectorize.width", i32 4} +; CHECK-NOT: !{metadata !"llvm.loop.vectorize.width", i32 4} +; CHECK: !{metadata !"llvm.loop.interleave.count", i32 1} |