SLP Vectorizer: Fix a bug in the code that does CSE on the generated gather sequences.

Make sure that we don't replace and RAUW two sequences if one does not dominate the other. llvm-svn: 184674
author: Nadav Rotem <nrotem@apple.com> 2013-06-23 21:57:27 +0000
committer: Nadav Rotem <nrotem@apple.com> 2013-06-23 21:57:27 +0000
commit: 0323925d5116690be55ca4657da0b356108077fb (patch)
tree: ec6c5817797bc6fa93ef2df1f286d1ffe6c93a1b /llvm/test/Transforms/SLPVectorizer/X86/cse.ll
parent: 14e200d14d02fd36fd1ff1fd02b9b150ce170db8 (diff)
download: bcm5719-llvm-0323925d5116690be55ca4657da0b356108077fb.tar.gz
bcm5719-llvm-0323925d5116690be55ca4657da0b356108077fb.zip
1 files changed, 51 insertions, 0 deletions
diff --git a/llvm/test/Transforms/SLPVectorizer/X86/cse.ll b/llvm/test/Transforms/SLPVectorizer/X86/cse.ll
index 6321b007683..d286798d704 100644
--- a/llvm/test/Transforms/SLPVectorizer/X86/cse.ll
+++ b/llvm/test/Transforms/SLPVectorizer/X86/cse.ll
@@ -83,3 +83,54 @@ entry:
   ret i32 undef
 }
 
+; int test2(double *G, int k) {
+;   if (k) {
+;     G[0] = 1+G[5]*4;
+;     G[1] = 6+G[6]*3;
+;   } else {
+;     G[2] = 7+G[5]*4;
+;     G[3] = 8+G[6]*3;
+;   }
+; }
+
+; We can't merge the gather sequences because one does not dominate the other.
+; CHECK: test2
+; CHECK: insertelement
+; CHECK: insertelement
+; CHECK: insertelement
+; CHECK: insertelement
+; CHECK: ret
+define i32 @test2(double* nocapture %G, i32 %k) {
+  %1 = icmp eq i32 %k, 0
+  %2 = getelementptr inbounds double* %G, i64 5
+  %3 = load double* %2, align 8
+  %4 = fmul double %3, 4.000000e+00
+  br i1 %1, label %12, label %5
+
+; <label>:5                                       ; preds = %0
+  %6 = fadd double %4, 1.000000e+00
+  store double %6, double* %G, align 8
+  %7 = getelementptr inbounds double* %G, i64 6
+  %8 = load double* %7, align 8
+  %9 = fmul double %8, 3.000000e+00
+  %10 = fadd double %9, 6.000000e+00
+  %11 = getelementptr inbounds double* %G, i64 1
+  store double %10, double* %11, align 8
+  br label %20
+
+; <label>:12                                      ; preds = %0
+  %13 = fadd double %4, 7.000000e+00
+  %14 = getelementptr inbounds double* %G, i64 2
+  store double %13, double* %14, align 8
+  %15 = getelementptr inbounds double* %G, i64 6
+  %16 = load double* %15, align 8
+  %17 = fmul double %16, 3.000000e+00
+  %18 = fadd double %17, 8.000000e+00
+  %19 = getelementptr inbounds double* %G, i64 3
+  store double %18, double* %19, align 8
+  br label %20
+
+; <label>:20                                      ; preds = %12, %5
+  ret i32 undef
+}
+
author	Nadav Rotem <nrotem@apple.com>	2013-06-23 21:57:27 +0000
committer	Nadav Rotem <nrotem@apple.com>	2013-06-23 21:57:27 +0000
commit	0323925d5116690be55ca4657da0b356108077fb (patch)
tree	ec6c5817797bc6fa93ef2df1f286d1ffe6c93a1b /llvm/test/Transforms/SLPVectorizer/X86/cse.ll
parent	14e200d14d02fd36fd1ff1fd02b9b150ce170db8 (diff)
download	bcm5719-llvm-0323925d5116690be55ca4657da0b356108077fb.tar.gz bcm5719-llvm-0323925d5116690be55ca4657da0b356108077fb.zip