summaryrefslogtreecommitdiffstats
path: root/llvm/test/Transforms/IPConstantProp/openmp_parallel_for.ll
diff options
context:
space:
mode:
Diffstat (limited to 'llvm/test/Transforms/IPConstantProp/openmp_parallel_for.ll')
-rw-r--r--llvm/test/Transforms/IPConstantProp/openmp_parallel_for.ll120
1 files changed, 120 insertions, 0 deletions
diff --git a/llvm/test/Transforms/IPConstantProp/openmp_parallel_for.ll b/llvm/test/Transforms/IPConstantProp/openmp_parallel_for.ll
new file mode 100644
index 00000000000..3c7ffe27f5d
--- /dev/null
+++ b/llvm/test/Transforms/IPConstantProp/openmp_parallel_for.ll
@@ -0,0 +1,120 @@
+; RUN: opt -S -ipconstprop < %s | FileCheck %s
+;
+; void bar(int, float, double);
+;
+; void foo(int N) {
+; float p = 3;
+; double q = 5;
+; N = 7;
+;
+; #pragma omp parallel for firstprivate(q)
+; for (int i = 2; i < N; i++) {
+; bar(i, p, q);
+; }
+; }
+;
+; Verify the constant value of q is propagated into the outlined function.
+;
+target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
+
+%struct.ident_t = type { i32, i32, i32, i32, i8* }
+
+@.str = private unnamed_addr constant [23 x i8] c";unknown;unknown;0;0;;\00", align 1
+@0 = private unnamed_addr global %struct.ident_t { i32 0, i32 514, i32 0, i32 0, i8* getelementptr inbounds ([23 x i8], [23 x i8]* @.str, i32 0, i32 0) }, align 8
+@1 = private unnamed_addr global %struct.ident_t { i32 0, i32 2, i32 0, i32 0, i8* getelementptr inbounds ([23 x i8], [23 x i8]* @.str, i32 0, i32 0) }, align 8
+
+define dso_local void @foo(i32 %N) {
+entry:
+ %N.addr = alloca i32, align 4
+ %p = alloca float, align 4
+ store i32 %N, i32* %N.addr, align 4
+ store float 3.000000e+00, float* %p, align 4
+ store i32 7, i32* %N.addr, align 4
+ call void (%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...) @__kmpc_fork_call(%struct.ident_t* nonnull @1, i32 3, void (i32*, i32*, ...)* bitcast (void (i32*, i32*, i32*, float*, i64)* @.omp_outlined. to void (i32*, i32*, ...)*), i32* nonnull %N.addr, float* nonnull %p, i64 4617315517961601024)
+ ret void
+}
+
+define internal void @.omp_outlined.(i32* noalias %.global_tid., i32* noalias %.bound_tid., i32* dereferenceable(4) %N, float* dereferenceable(4) %p, i64 %q) {
+entry:
+ %q.addr = alloca i64, align 8
+ %.omp.lb = alloca i32, align 4
+ %.omp.ub = alloca i32, align 4
+ %.omp.stride = alloca i32, align 4
+ %.omp.is_last = alloca i32, align 4
+; CHECK: store i64 4617315517961601024, i64* %q.addr, align 8
+ store i64 %q, i64* %q.addr, align 8
+ %conv = bitcast i64* %q.addr to double*
+ %tmp = load i32, i32* %N, align 4
+ %sub3 = add nsw i32 %tmp, -3
+ %cmp = icmp sgt i32 %tmp, 2
+ br i1 %cmp, label %omp.precond.then, label %omp.precond.end
+
+omp.precond.then: ; preds = %entry
+ store i32 0, i32* %.omp.lb, align 4
+ store i32 %sub3, i32* %.omp.ub, align 4
+ store i32 1, i32* %.omp.stride, align 4
+ store i32 0, i32* %.omp.is_last, align 4
+ %tmp5 = load i32, i32* %.global_tid., align 4
+ call void @__kmpc_for_static_init_4(%struct.ident_t* nonnull @0, i32 %tmp5, i32 34, i32* nonnull %.omp.is_last, i32* nonnull %.omp.lb, i32* nonnull %.omp.ub, i32* nonnull %.omp.stride, i32 1, i32 1)
+ %tmp6 = load i32, i32* %.omp.ub, align 4
+ %cmp6 = icmp sgt i32 %tmp6, %sub3
+ br i1 %cmp6, label %cond.true, label %cond.false
+
+cond.true: ; preds = %omp.precond.then
+ br label %cond.end
+
+cond.false: ; preds = %omp.precond.then
+ %tmp7 = load i32, i32* %.omp.ub, align 4
+ br label %cond.end
+
+cond.end: ; preds = %cond.false, %cond.true
+ %cond = phi i32 [ %sub3, %cond.true ], [ %tmp7, %cond.false ]
+ store i32 %cond, i32* %.omp.ub, align 4
+ %tmp8 = load i32, i32* %.omp.lb, align 4
+ br label %omp.inner.for.cond
+
+omp.inner.for.cond: ; preds = %omp.inner.for.inc, %cond.end
+ %.omp.iv.0 = phi i32 [ %tmp8, %cond.end ], [ %add11, %omp.inner.for.inc ]
+ %tmp9 = load i32, i32* %.omp.ub, align 4
+ %cmp8 = icmp sgt i32 %.omp.iv.0, %tmp9
+ br i1 %cmp8, label %omp.inner.for.cond.cleanup, label %omp.inner.for.body
+
+omp.inner.for.cond.cleanup: ; preds = %omp.inner.for.cond
+ br label %omp.inner.for.end
+
+omp.inner.for.body: ; preds = %omp.inner.for.cond
+ %add10 = add nsw i32 %.omp.iv.0, 2
+ %tmp10 = load float, float* %p, align 4
+ %tmp11 = load double, double* %conv, align 8
+ call void @bar(i32 %add10, float %tmp10, double %tmp11)
+ br label %omp.body.continue
+
+omp.body.continue: ; preds = %omp.inner.for.body
+ br label %omp.inner.for.inc
+
+omp.inner.for.inc: ; preds = %omp.body.continue
+ %add11 = add nsw i32 %.omp.iv.0, 1
+ br label %omp.inner.for.cond
+
+omp.inner.for.end: ; preds = %omp.inner.for.cond.cleanup
+ br label %omp.loop.exit
+
+omp.loop.exit: ; preds = %omp.inner.for.end
+ %tmp12 = load i32, i32* %.global_tid., align 4
+ call void @__kmpc_for_static_fini(%struct.ident_t* nonnull @0, i32 %tmp12)
+ br label %omp.precond.end
+
+omp.precond.end: ; preds = %omp.loop.exit, %entry
+ ret void
+}
+
+declare dso_local void @__kmpc_for_static_init_4(%struct.ident_t*, i32, i32, i32*, i32*, i32*, i32*, i32, i32)
+
+declare dso_local void @bar(i32, float, double)
+
+declare dso_local void @__kmpc_for_static_fini(%struct.ident_t*, i32)
+
+declare !callback !0 dso_local void @__kmpc_fork_call(%struct.ident_t*, i32, void (i32*, i32*, ...)*, ...)
+
+!1 = !{i64 2, i64 -1, i64 -1, i1 true}
+!0 = !{!1}
OpenPOWER on IntegriCloud