diff options
author | Dmitri Gribenko <gribozavr@gmail.com> | 2019-10-14 12:22:48 +0000 |
---|---|---|
committer | Dmitri Gribenko <gribozavr@gmail.com> | 2019-10-14 12:22:48 +0000 |
commit | 1a21f98ac3c57d027908000b8bac356daec51416 (patch) | |
tree | 9ed8a7cdea6b2580e007cf82401073f4ffff08ba /llvm/test | |
parent | c4d256a59049d4b2f21da83f43b9caba2427885e (diff) | |
download | bcm5719-llvm-1a21f98ac3c57d027908000b8bac356daec51416.tar.gz bcm5719-llvm-1a21f98ac3c57d027908000b8bac356daec51416.zip |
Revert "Add a pass to lower is.constant and objectsize intrinsics"
This reverts commit r374743. It broke the build with Ocaml enabled:
http://lab.llvm.org:8011/builders/clang-x86_64-debian-fast/builds/19218
llvm-svn: 374768
Diffstat (limited to 'llvm/test')
19 files changed, 390 insertions, 135 deletions
diff --git a/llvm/test/CodeGen/AArch64/GlobalISel/arm64-irtranslator.ll b/llvm/test/CodeGen/AArch64/GlobalISel/arm64-irtranslator.ll index 598510df98a..4f9dcd1686a 100644 --- a/llvm/test/CodeGen/AArch64/GlobalISel/arm64-irtranslator.ll +++ b/llvm/test/CodeGen/AArch64/GlobalISel/arm64-irtranslator.ll @@ -1183,6 +1183,23 @@ define void @test_memset(i8* %dst, i8 %val, i64 %size) { ret void } +declare i64 @llvm.objectsize.i64(i8*, i1) +declare i32 @llvm.objectsize.i32(i8*, i1) +define void @test_objectsize(i8* %addr0, i8* %addr1) { +; CHECK-LABEL: name: test_objectsize +; CHECK: [[ADDR0:%[0-9]+]]:_(p0) = COPY $x0 +; CHECK: [[ADDR1:%[0-9]+]]:_(p0) = COPY $x1 +; CHECK: {{%[0-9]+}}:_(s64) = G_CONSTANT i64 -1 +; CHECK: {{%[0-9]+}}:_(s64) = G_CONSTANT i64 0 +; CHECK: {{%[0-9]+}}:_(s32) = G_CONSTANT i32 -1 +; CHECK: {{%[0-9]+}}:_(s32) = G_CONSTANT i32 0 + %size64.0 = call i64 @llvm.objectsize.i64(i8* %addr0, i1 0) + %size64.intmin = call i64 @llvm.objectsize.i64(i8* %addr0, i1 1) + %size32.0 = call i32 @llvm.objectsize.i32(i8* %addr0, i1 0) + %size32.intmin = call i32 @llvm.objectsize.i32(i8* %addr0, i1 1) + ret void +} + define void @test_large_const(i128* %addr) { ; CHECK-LABEL: name: test_large_const ; CHECK: [[ADDR:%[0-9]+]]:_(p0) = COPY $x0 diff --git a/llvm/test/CodeGen/AArch64/O0-pipeline.ll b/llvm/test/CodeGen/AArch64/O0-pipeline.ll index 20214fb83f4..9611946f710 100644 --- a/llvm/test/CodeGen/AArch64/O0-pipeline.ll +++ b/llvm/test/CodeGen/AArch64/O0-pipeline.ll @@ -21,7 +21,6 @@ ; CHECK-NEXT: Module Verifier ; CHECK-NEXT: Lower Garbage Collection Instructions ; CHECK-NEXT: Shadow Stack GC Lowering -; CHECK-NEXT: Lower constant intrinsics ; CHECK-NEXT: Remove unreachable blocks from the CFG ; CHECK-NEXT: Instrument function entry/exit with calls to e.g. mcount() (post inlining) ; CHECK-NEXT: Scalarize Masked Memory Intrinsics diff --git a/llvm/test/CodeGen/AArch64/O3-pipeline.ll b/llvm/test/CodeGen/AArch64/O3-pipeline.ll index f483d631167..35417deec1a 100644 --- a/llvm/test/CodeGen/AArch64/O3-pipeline.ll +++ b/llvm/test/CodeGen/AArch64/O3-pipeline.ll @@ -38,7 +38,6 @@ ; CHECK-NEXT: Expand memcmp() to load/stores ; CHECK-NEXT: Lower Garbage Collection Instructions ; CHECK-NEXT: Shadow Stack GC Lowering -; CHECK-NEXT: Lower constant intrinsics ; CHECK-NEXT: Remove unreachable blocks from the CFG ; CHECK-NEXT: Dominator Tree Construction ; CHECK-NEXT: Natural Loop Information diff --git a/llvm/test/CodeGen/ARM/O3-pipeline.ll b/llvm/test/CodeGen/ARM/O3-pipeline.ll index 6cc7e53aeff..cbfc1e86a36 100644 --- a/llvm/test/CodeGen/ARM/O3-pipeline.ll +++ b/llvm/test/CodeGen/ARM/O3-pipeline.ll @@ -22,7 +22,6 @@ ; CHECK-NEXT: Expand memcmp() to load/stores ; CHECK-NEXT: Lower Garbage Collection Instructions ; CHECK-NEXT: Shadow Stack GC Lowering -; CHECK-NEXT: Lower constant intrinsics ; CHECK-NEXT: Remove unreachable blocks from the CFG ; CHECK-NEXT: Dominator Tree Construction ; CHECK-NEXT: Natural Loop Information diff --git a/llvm/test/CodeGen/Generic/is-constant.ll b/llvm/test/CodeGen/Generic/is-constant.ll new file mode 100644 index 00000000000..2e1f4261d6a --- /dev/null +++ b/llvm/test/CodeGen/Generic/is-constant.ll @@ -0,0 +1,114 @@ +; RUN: opt -O2 -S < %s | FileCheck %s +; RUN: llc -o /dev/null 2>&1 < %s +; RUN: llc -O0 -o /dev/null 2>&1 < %s + +;; The llc runs above are just to ensure it doesn't blow up upon +;; seeing an is_constant intrinsic. + +declare i1 @llvm.is.constant.i32(i32 %a) +declare i1 @llvm.is.constant.i64(i64 %a) +declare i1 @llvm.is.constant.i256(i256 %a) +declare i1 @llvm.is.constant.v2i64(<2 x i64> %a) +declare i1 @llvm.is.constant.f32(float %a) +declare i1 @llvm.is.constant.sl_i32i32s({i32, i32} %a) +declare i1 @llvm.is.constant.a2i64([2 x i64] %a) +declare i1 @llvm.is.constant.p0i64(i64* %a) + +;; Basic test that optimization folds away the is.constant when given +;; a constant. +define i1 @test_constant() #0 { +; CHECK-LABEL: @test_constant( +; CHECK-NOT: llvm.is.constant +; CHECK: ret i1 true +%y = call i1 @llvm.is.constant.i32(i32 44) + ret i1 %y +} + +;; And test that the intrinsic sticks around when given a +;; non-constant. +define i1 @test_nonconstant(i32 %x) #0 { +; CHECK-LABEL: @test_nonconstant( +; CHECK: @llvm.is.constant + %y = call i1 @llvm.is.constant.i32(i32 %x) + ret i1 %y +} + +;; Ensure that nested is.constants fold. +define i32 @test_nested() #0 { +; CHECK-LABEL: @test_nested( +; CHECK-NOT: llvm.is.constant +; CHECK: ret i32 13 + %val1 = call i1 @llvm.is.constant.i32(i32 27) + %val2 = zext i1 %val1 to i32 + %val3 = add i32 %val2, 12 + %1 = call i1 @llvm.is.constant.i32(i32 %val3) + %2 = zext i1 %1 to i32 + %3 = add i32 %2, 12 + ret i32 %3 +} + +@G = global [2 x i64] zeroinitializer +define i1 @test_global() #0 { +; CHECK-LABEL: @test_global( +; CHECK: llvm.is.constant + %ret = call i1 @llvm.is.constant.p0i64(i64* getelementptr ([2 x i64], [2 x i64]* @G, i32 0, i32 0)) + ret i1 %ret +} + +define i1 @test_diff() #0 { +; CHECK-LABEL: @test_diff( + %ret = call i1 @llvm.is.constant.i64(i64 sub ( + i64 ptrtoint (i64* getelementptr inbounds ([2 x i64], [2 x i64]* @G, i64 0, i64 1) to i64), + i64 ptrtoint ([2 x i64]* @G to i64))) + ret i1 %ret +} + +define i1 @test_various_types(i256 %int, float %float, <2 x i64> %vec, {i32, i32} %struct, [2 x i64] %arr, i64* %ptr) #0 { +; CHECK-LABEL: @test_various_types( +; CHECK: llvm.is.constant +; CHECK: llvm.is.constant +; CHECK: llvm.is.constant +; CHECK: llvm.is.constant +; CHECK: llvm.is.constant +; CHECK: llvm.is.constant +; CHECK-NOT: llvm.is.constant + %v1 = call i1 @llvm.is.constant.i256(i256 %int) + %v2 = call i1 @llvm.is.constant.f32(float %float) + %v3 = call i1 @llvm.is.constant.v2i64(<2 x i64> %vec) + %v4 = call i1 @llvm.is.constant.sl_i32i32s({i32, i32} %struct) + %v5 = call i1 @llvm.is.constant.a2i64([2 x i64] %arr) + %v6 = call i1 @llvm.is.constant.p0i64(i64* %ptr) + + %c1 = call i1 @llvm.is.constant.i256(i256 -1) + %c2 = call i1 @llvm.is.constant.f32(float 17.0) + %c3 = call i1 @llvm.is.constant.v2i64(<2 x i64> <i64 -1, i64 44>) + %c4 = call i1 @llvm.is.constant.sl_i32i32s({i32, i32} {i32 -1, i32 32}) + %c5 = call i1 @llvm.is.constant.a2i64([2 x i64] [i64 -1, i64 32]) + %c6 = call i1 @llvm.is.constant.p0i64(i64* inttoptr (i32 42 to i64*)) + + %x1 = add i1 %v1, %c1 + %x2 = add i1 %v2, %c2 + %x3 = add i1 %v3, %c3 + %x4 = add i1 %v4, %c4 + %x5 = add i1 %v5, %c5 + %x6 = add i1 %v6, %c6 + + %res2 = add i1 %x1, %x2 + %res3 = add i1 %res2, %x3 + %res4 = add i1 %res3, %x4 + %res5 = add i1 %res4, %x5 + %res6 = add i1 %res5, %x6 + + ret i1 %res6 +} + +define i1 @test_various_types2() #0 { +; CHECK-LABEL: @test_various_types2( +; CHECK: ret i1 false + %r = call i1 @test_various_types(i256 -1, float 22.0, <2 x i64> <i64 -1, i64 44>, + {i32, i32} {i32 -1, i32 55}, [2 x i64] [i64 -1, i64 55], + i64* inttoptr (i64 42 to i64*)) + ret i1 %r +} + +attributes #0 = { nounwind uwtable } diff --git a/llvm/test/CodeGen/X86/O0-pipeline.ll b/llvm/test/CodeGen/X86/O0-pipeline.ll index b6e1e459c2d..271aec5fa05 100644 --- a/llvm/test/CodeGen/X86/O0-pipeline.ll +++ b/llvm/test/CodeGen/X86/O0-pipeline.ll @@ -24,7 +24,6 @@ ; CHECK-NEXT: Module Verifier ; CHECK-NEXT: Lower Garbage Collection Instructions ; CHECK-NEXT: Shadow Stack GC Lowering -; CHECK-NEXT: Lower constant intrinsics ; CHECK-NEXT: Remove unreachable blocks from the CFG ; CHECK-NEXT: Instrument function entry/exit with calls to e.g. mcount() (post inlining) ; CHECK-NEXT: Scalarize Masked Memory Intrinsics diff --git a/llvm/test/CodeGen/X86/O3-pipeline.ll b/llvm/test/CodeGen/X86/O3-pipeline.ll index 389c21f0a8f..d7569ccb2da 100644 --- a/llvm/test/CodeGen/X86/O3-pipeline.ll +++ b/llvm/test/CodeGen/X86/O3-pipeline.ll @@ -35,7 +35,6 @@ ; CHECK-NEXT: Expand memcmp() to load/stores ; CHECK-NEXT: Lower Garbage Collection Instructions ; CHECK-NEXT: Shadow Stack GC Lowering -; CHECK-NEXT: Lower constant intrinsics ; CHECK-NEXT: Remove unreachable blocks from the CFG ; CHECK-NEXT: Dominator Tree Construction ; CHECK-NEXT: Natural Loop Information diff --git a/llvm/test/CodeGen/X86/is-constant.ll b/llvm/test/CodeGen/X86/is-constant.ll new file mode 100644 index 00000000000..b4c1f351a2a --- /dev/null +++ b/llvm/test/CodeGen/X86/is-constant.ll @@ -0,0 +1,50 @@ +; RUN: llc -O2 < %s | FileCheck %s --check-prefix=CHECK-O2 --check-prefix=CHECK +; RUN: llc -O0 -fast-isel < %s | FileCheck %s --check-prefix=CHECK-O0 --check-prefix=CHECK +; RUN: llc -O0 -fast-isel=0 < %s | FileCheck %s --check-prefix=CHECK-O0 --check-prefix=CHECK +; RUN: llc -O0 -global-isel < %s | FileCheck %s --check-prefix=CHECK-O0 --check-prefix=CHECK + +;; Ensure that an unfoldable is.constant gets lowered reasonably in +;; optimized codegen, in particular, that the "true" branch is +;; eliminated. +;; +;; This isn't asserting any specific output from non-optimized runs, +;; (e.g., currently the not-taken branch does not get eliminated). But +;; it does ensure that lowering succeeds in all 3 codegen paths. + +target triple = "x86_64-unknown-linux-gnu" + +declare i1 @llvm.is.constant.i32(i32 %a) nounwind readnone +declare i1 @llvm.is.constant.i64(i64 %a) nounwind readnone +declare i64 @llvm.objectsize.i64.p0i8(i8*, i1, i1, i1) nounwind readnone + +declare i32 @subfun_1() +declare i32 @subfun_2() + +define i32 @test_branch(i32 %in) nounwind { +; CHECK-LABEL: test_branch: +; CHECK-O2: %bb.0: +; CHECK-O2-NEXT: jmp subfun_2 + %v = call i1 @llvm.is.constant.i32(i32 %in) + br i1 %v, label %True, label %False + +True: + %call1 = tail call i32 @subfun_1() + ret i32 %call1 + +False: + %call2 = tail call i32 @subfun_2() + ret i32 %call2 +} + +;; llvm.objectsize is another tricky case which gets folded to -1 very +;; late in the game. We'd like to ensure that llvm.is.constant of +;; llvm.objectsize is true. +define i1 @test_objectsize(i8* %obj) nounwind { +; CHECK-LABEL: test_objectsize: +; CHECK-O2: %bb.0: +; CHECK-O2: movb $1, %al +; CHECK-O2-NEXT: retq + %os = call i64 @llvm.objectsize.i64.p0i8(i8* %obj, i1 false, i1 false, i1 false) + %v = call i1 @llvm.is.constant.i64(i64 %os) + ret i1 %v +} diff --git a/llvm/test/CodeGen/X86/object-size.ll b/llvm/test/CodeGen/X86/object-size.ll new file mode 100644 index 00000000000..b795e0fda8b --- /dev/null +++ b/llvm/test/CodeGen/X86/object-size.ll @@ -0,0 +1,55 @@ +; RUN: llc -O0 < %s | FileCheck %s + +; ModuleID = 'ts.c' +target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64" +target triple = "x86_64-apple-darwin10.0" + +@p = common global i8* null, align 8 ; <i8**> [#uses=4] +@.str = private constant [3 x i8] c"Hi\00" ; <[3 x i8]*> [#uses=1] + +define void @bar() nounwind ssp { +entry: + %tmp = load i8*, i8** @p ; <i8*> [#uses=1] + %0 = call i64 @llvm.objectsize.i64.p0i8(i8* %tmp, i1 0) ; <i64> [#uses=1] + %cmp = icmp ne i64 %0, -1 ; <i1> [#uses=1] +; CHECK: movq $-1, [[RAX:%r..]] +; CHECK: cmpq $-1, [[RAX]] + br i1 %cmp, label %cond.true, label %cond.false + +cond.true: ; preds = %entry + %tmp1 = load i8*, i8** @p ; <i8*> [#uses=1] + %tmp2 = load i8*, i8** @p ; <i8*> [#uses=1] + %1 = call i64 @llvm.objectsize.i64.p0i8(i8* %tmp2, i1 1) ; <i64> [#uses=1] + %call = call i8* @__strcpy_chk(i8* %tmp1, i8* getelementptr inbounds ([3 x i8], [3 x i8]* @.str, i32 0, i32 0), i64 %1) ssp ; <i8*> [#uses=1] + br label %cond.end + +cond.false: ; preds = %entry + %tmp3 = load i8*, i8** @p ; <i8*> [#uses=1] + %call4 = call i8* @__inline_strcpy_chk(i8* %tmp3, i8* getelementptr inbounds ([3 x i8], [3 x i8]* @.str, i32 0, i32 0)) ssp ; <i8*> [#uses=1] + br label %cond.end + +cond.end: ; preds = %cond.false, %cond.true + %cond = phi i8* [ %call, %cond.true ], [ %call4, %cond.false ] ; <i8*> [#uses=0] + ret void +} + +declare i64 @llvm.objectsize.i64.p0i8(i8*, i1) nounwind readonly + +declare i8* @__strcpy_chk(i8*, i8*, i64) ssp + +define internal i8* @__inline_strcpy_chk(i8* %__dest, i8* %__src) nounwind ssp { +entry: + %retval = alloca i8* ; <i8**> [#uses=2] + %__dest.addr = alloca i8* ; <i8**> [#uses=3] + %__src.addr = alloca i8* ; <i8**> [#uses=2] + store i8* %__dest, i8** %__dest.addr + store i8* %__src, i8** %__src.addr + %tmp = load i8*, i8** %__dest.addr ; <i8*> [#uses=1] + %tmp1 = load i8*, i8** %__src.addr ; <i8*> [#uses=1] + %tmp2 = load i8*, i8** %__dest.addr ; <i8*> [#uses=1] + %0 = call i64 @llvm.objectsize.i64.p0i8(i8* %tmp2, i1 1) ; <i64> [#uses=1] + %call = call i8* @__strcpy_chk(i8* %tmp, i8* %tmp1, i64 %0) ssp ; <i8*> [#uses=1] + store i8* %call, i8** %retval + %1 = load i8*, i8** %retval ; <i8*> [#uses=1] + ret i8* %1 +} diff --git a/llvm/test/Other/new-pm-defaults.ll b/llvm/test/Other/new-pm-defaults.ll index 638c783725b..4e07bffd3dc 100644 --- a/llvm/test/Other/new-pm-defaults.ll +++ b/llvm/test/Other/new-pm-defaults.ll @@ -231,7 +231,6 @@ ; CHECK-O-NEXT: Running pass: ModuleToFunctionPassAdaptor<{{.*}}PassManager{{.*}}> ; CHECK-O-NEXT: Starting llvm::Function pass manager run. ; CHECK-O-NEXT: Running pass: Float2IntPass -; CHECK-O-NEXT: Running pass: LowerConstantIntrinsicsPass on foo ; CHECK-EP-VECTORIZER-START-NEXT: Running pass: NoOpFunctionPass ; CHECK-O-NEXT: Running pass: FunctionToLoopPassAdaptor<{{.*}}LoopRotatePass ; CHECK-O-NEXT: Starting llvm::Function pass manager run. diff --git a/llvm/test/Other/new-pm-thinlto-defaults.ll b/llvm/test/Other/new-pm-thinlto-defaults.ll index 7b6855b130e..686bb9b6ea9 100644 --- a/llvm/test/Other/new-pm-thinlto-defaults.ll +++ b/llvm/test/Other/new-pm-thinlto-defaults.ll @@ -205,7 +205,6 @@ ; CHECK-POSTLINK-O-NEXT: Running pass: ModuleToFunctionPassAdaptor<{{.*}}PassManager{{.*}}> ; CHECK-POSTLINK-O-NEXT: Starting llvm::Function pass manager run. ; CHECK-POSTLINK-O-NEXT: Running pass: Float2IntPass -; CHECK-POSTLINK-O-NEXT: Running pass: LowerConstantIntrinsicsPass ; CHECK-POSTLINK-O-NEXT: Running pass: FunctionToLoopPassAdaptor<{{.*}}LoopRotatePass ; CHECK-POSTLINK-O-NEXT: Starting llvm::Function pass manager run ; CHECK-POSTLINK-O-NEXT: Running pass: LoopSimplifyPass diff --git a/llvm/test/Other/opt-O2-pipeline.ll b/llvm/test/Other/opt-O2-pipeline.ll index e1f19e74733..f8603ef12a7 100644 --- a/llvm/test/Other/opt-O2-pipeline.ll +++ b/llvm/test/Other/opt-O2-pipeline.ll @@ -187,8 +187,6 @@ ; CHECK-NEXT: FunctionPass Manager ; CHECK-NEXT: Dominator Tree Construction ; CHECK-NEXT: Float to int -; CHECK-NEXT: Lower constant intrinsics -; CHECK-NEXT: Dominator Tree Construction ; CHECK-NEXT: Basic Alias Analysis (stateless AA impl) ; CHECK-NEXT: Function Alias Analysis Results ; CHECK-NEXT: Memory SSA diff --git a/llvm/test/Other/opt-O3-pipeline.ll b/llvm/test/Other/opt-O3-pipeline.ll index 3bfb921efc6..5f02df4ea70 100644 --- a/llvm/test/Other/opt-O3-pipeline.ll +++ b/llvm/test/Other/opt-O3-pipeline.ll @@ -192,8 +192,6 @@ ; CHECK-NEXT: FunctionPass Manager ; CHECK-NEXT: Dominator Tree Construction ; CHECK-NEXT: Float to int -; CHECK-NEXT: Lower constant intrinsics -; CHECK-NEXT: Dominator Tree Construction ; CHECK-NEXT: Basic Alias Analysis (stateless AA impl) ; CHECK-NEXT: Function Alias Analysis Results ; CHECK-NEXT: Memory SSA diff --git a/llvm/test/Other/opt-Os-pipeline.ll b/llvm/test/Other/opt-Os-pipeline.ll index 02271fb2032..127ccede060 100644 --- a/llvm/test/Other/opt-Os-pipeline.ll +++ b/llvm/test/Other/opt-Os-pipeline.ll @@ -174,8 +174,6 @@ ; CHECK-NEXT: FunctionPass Manager ; CHECK-NEXT: Dominator Tree Construction ; CHECK-NEXT: Float to int -; CHECK-NEXT: Lower constant intrinsics -; CHECK-NEXT: Dominator Tree Construction ; CHECK-NEXT: Basic Alias Analysis (stateless AA impl) ; CHECK-NEXT: Function Alias Analysis Results ; CHECK-NEXT: Memory SSA diff --git a/llvm/test/Transforms/CodeGenPrepare/X86/overflow-intrinsics.ll b/llvm/test/Transforms/CodeGenPrepare/X86/overflow-intrinsics.ll index 9ba1d7db5ad..fc6d66a6082 100644 --- a/llvm/test/Transforms/CodeGenPrepare/X86/overflow-intrinsics.ll +++ b/llvm/test/Transforms/CodeGenPrepare/X86/overflow-intrinsics.ll @@ -514,6 +514,26 @@ exit: ret void } +; This was crashing when trying to delay instruction removal/deletion. + +declare i64 @llvm.objectsize.i64.p0i8(i8*, i1 immarg, i1 immarg, i1 immarg) #0 + +define hidden fastcc void @crash() { +; CHECK-LABEL: @crash( +; CHECK-NEXT: [[TMP1:%.*]] = call { i64, i1 } @llvm.uadd.with.overflow.i64(i64 undef, i64 undef) +; CHECK-NEXT: [[MATH:%.*]] = extractvalue { i64, i1 } [[TMP1]], 0 +; CHECK-NEXT: [[OV:%.*]] = extractvalue { i64, i1 } [[TMP1]], 1 +; CHECK-NEXT: [[T2:%.*]] = select i1 undef, i1 undef, i1 [[OV]] +; CHECK-NEXT: unreachable +; + %t0 = add i64 undef, undef + %t1 = icmp ult i64 %t0, undef + %t2 = select i1 undef, i1 undef, i1 %t1 + %t3 = call i64 @llvm.objectsize.i64.p0i8(i8* nonnull undef, i1 false, i1 false, i1 false) + %t4 = icmp ugt i64 %t3, 7 + unreachable +} + ; Check that every instruction inserted by -codegenprepare has a debug location. ; DEBUG: CheckModuleDebugify: PASS diff --git a/llvm/test/Transforms/LowerConstantIntrinsics/objectsize_basic.ll b/llvm/test/Transforms/CodeGenPrepare/basic.ll index 94aba44fcc4..1a58d61b6e9 100644 --- a/llvm/test/Transforms/LowerConstantIntrinsics/objectsize_basic.ll +++ b/llvm/test/Transforms/CodeGenPrepare/basic.ll @@ -1,15 +1,12 @@ -; RUN: opt -lower-constant-intrinsics -S < %s | FileCheck %s +; RUN: opt -codegenprepare -S < %s | FileCheck %s target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64" target triple = "x86_64-apple-darwin10.0.0" -declare i64 @llvm.objectsize.i64(i8*, i1, i1, i1) nounwind readonly -declare i64 @llvm.objectsize.i64.p1i8(i8 addrspace(1)*, i1, i1, i1) nounwind readonly -declare void @llvm.trap() nounwind - ; CHECK-LABEL: @test1( ; objectsize should fold to a constant, which causes the branch to fold to an -; uncond branch. +; uncond branch. Next, we fold the control flow alltogether. +; rdar://8785296 define i32 @test1(i8* %ptr) nounwind ssp noredzone align 2 { entry: %0 = tail call i64 @llvm.objectsize.i64(i8* %ptr, i1 false, i1 false, i1 false) @@ -17,7 +14,7 @@ entry: br i1 %1, label %T, label %trap ; CHECK: entry: -; CHECK-NOT: label %trap +; CHECK-NOT: br label % trap: ; preds = %0, %entry tail call void @llvm.trap() noreturn nounwind @@ -81,3 +78,9 @@ entry: i1 false, i1 false) ret i64 %0 } + + +declare i64 @llvm.objectsize.i64(i8*, i1, i1, i1) nounwind readonly +declare i64 @llvm.objectsize.i64.p1i8(i8 addrspace(1)*, i1, i1, i1) nounwind readonly + +declare void @llvm.trap() nounwind diff --git a/llvm/test/Transforms/CodeGenPrepare/builtin-condition.ll b/llvm/test/Transforms/CodeGenPrepare/builtin-condition.ll new file mode 100644 index 00000000000..e42529a7b9a --- /dev/null +++ b/llvm/test/Transforms/CodeGenPrepare/builtin-condition.ll @@ -0,0 +1,123 @@ +; RUN: opt -codegenprepare -S < %s | FileCheck %s + +; Ensure we act sanely on overflow. +; CHECK-LABEL: define i32 @bar +define i32 @bar() { +entry: + ; CHECK: ret i32 -1 + %az = alloca [2147483649 x i32], align 16 + %a = alloca i8*, align 8 + %arraydecay = getelementptr inbounds [2147483649 x i32], [2147483649 x i32]* %az, i32 0, i32 0 + %0 = bitcast i32* %arraydecay to i8* + store i8* %0, i8** %a, align 8 + %1 = load i8*, i8** %a, align 8 + %2 = call i32 @llvm.objectsize.i32.p0i8(i8* %1, i1 false) + ret i32 %2 +} + +; CHECK-LABEL: define i32 @baz +define i32 @baz(i32 %n) { +entry: + ; CHECK: ret i32 -1 + %az = alloca [1 x i32], align 16 + %bz = alloca [4294967297 x i32], align 16 + %tobool = icmp ne i32 %n, 0 + %arraydecay = getelementptr inbounds [1 x i32], [1 x i32]* %az, i64 0, i64 0 + %arraydecay1 = getelementptr inbounds [4294967297 x i32], [4294967297 x i32]* %bz, i64 0, i64 0 + %cond = select i1 %tobool, i32* %arraydecay, i32* %arraydecay1 + %0 = bitcast i32* %cond to i8* + %1 = call i32 @llvm.objectsize.i32.p0i8(i8* %0, i1 false) + ret i32 %1 +} + +declare i32 @llvm.objectsize.i32.p0i8(i8*, i1) + +; The following tests were generated by: +; #include<stdlib.h> +; #define STATIC_BUF_SIZE 10 +; #define LARGER_BUF_SIZE 30 +; +; size_t foo1(int flag) { +; char *cptr; +; char chararray[LARGER_BUF_SIZE]; +; char chararray2[STATIC_BUF_SIZE]; +; if(flag) +; cptr = chararray2; +; else +; cptr = chararray; +; +; return __builtin_object_size(cptr, 2); +; } +; +; size_t foo2(int n) { +; char Small[10]; +; char Large[20]; +; char *Ptr = n ? Small : Large + 19; +; return __builtin_object_size(Ptr, 0); +; } +; +; void foo() { +; size_t ret; +; size_t ret1; +; ret = foo1(0); +; ret1 = foo2(0); +; printf("\n%d %d\n", ret, ret1); +; } + +target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128" +target triple = "x86_64-unknown-linux-gnu" + +@.str = private unnamed_addr constant [8 x i8] c"\0A%d %d\0A\00", align 1 + +define i64 @foo1(i32 %flag) { +entry: + %chararray = alloca [30 x i8], align 16 + %chararray2 = alloca [10 x i8], align 1 + %0 = getelementptr inbounds [30 x i8], [30 x i8]* %chararray, i64 0, i64 0 + call void @llvm.lifetime.start.p0i8(i64 30, i8* %0) + %1 = getelementptr inbounds [10 x i8], [10 x i8]* %chararray2, i64 0, i64 0 + call void @llvm.lifetime.start.p0i8(i64 10, i8* %1) + %tobool = icmp eq i32 %flag, 0 + %cptr.0 = select i1 %tobool, i8* %0, i8* %1 + %2 = call i64 @llvm.objectsize.i64.p0i8(i8* %cptr.0, i1 true) + call void @llvm.lifetime.end.p0i8(i64 10, i8* %1) + call void @llvm.lifetime.end.p0i8(i64 30, i8* %0) + ret i64 %2 +; CHECK-LABEL: foo1 +; CHECK: ret i64 10 +} + +declare void @llvm.lifetime.start.p0i8(i64, i8* nocapture) + +declare i64 @llvm.objectsize.i64.p0i8(i8*, i1) + +declare void @llvm.lifetime.end.p0i8(i64, i8* nocapture) + +define i64 @foo2(i32 %n) { +entry: + %Small = alloca [10 x i8], align 1 + %Large = alloca [20 x i8], align 16 + %0 = getelementptr inbounds [10 x i8], [10 x i8]* %Small, i64 0, i64 0 + call void @llvm.lifetime.start.p0i8(i64 10, i8* %0) + %1 = getelementptr inbounds [20 x i8], [20 x i8]* %Large, i64 0, i64 0 + call void @llvm.lifetime.start.p0i8(i64 20, i8* %1) + %tobool = icmp ne i32 %n, 0 + %add.ptr = getelementptr inbounds [20 x i8], [20 x i8]* %Large, i64 0, i64 19 + %cond = select i1 %tobool, i8* %0, i8* %add.ptr + %2 = call i64 @llvm.objectsize.i64.p0i8(i8* %cond, i1 false) + call void @llvm.lifetime.end.p0i8(i64 20, i8* %1) + call void @llvm.lifetime.end.p0i8(i64 10, i8* %0) + ret i64 %2 +; CHECK-LABEL: foo2 +; CHECK: ret i64 10 +} + +define void @foo() { +entry: + %call = tail call i64 @foo1(i32 0) + %call1 = tail call i64 @foo2(i32 0) + %call2 = tail call i32 (i8*, ...) @printf(i8* getelementptr inbounds ([8 x i8], [8 x i8]* @.str, i64 0, i64 0), i64 %call, i64 %call1) + ret void +} + +declare i32 @printf(i8* nocapture readonly, ...) diff --git a/llvm/test/Transforms/LowerConstantIntrinsics/crash-on-large-allocas.ll b/llvm/test/Transforms/CodeGenPrepare/crash-on-large-allocas.ll index e4e981161fd..5049207ec27 100644 --- a/llvm/test/Transforms/LowerConstantIntrinsics/crash-on-large-allocas.ll +++ b/llvm/test/Transforms/CodeGenPrepare/crash-on-large-allocas.ll @@ -1,4 +1,4 @@ -; RUN: opt -S -lower-constant-intrinsics %s -o - | FileCheck %s +; RUN: opt -S -codegenprepare %s -o - | FileCheck %s ; ; Ensure that we don't {crash,return a bad value} when given an alloca larger ; than what a pointer can represent. diff --git a/llvm/test/Transforms/LowerConstantIntrinsics/constant-intrinsics.ll b/llvm/test/Transforms/LowerConstantIntrinsics/constant-intrinsics.ll deleted file mode 100644 index b2c98d2049c..00000000000 --- a/llvm/test/Transforms/LowerConstantIntrinsics/constant-intrinsics.ll +++ /dev/null @@ -1,114 +0,0 @@ -; RUN: opt -lower-constant-intrinsics -S < %s | FileCheck %s - -;; Ensure that an unfoldable is.constant gets lowered reasonably in -;; optimized codegen, in particular, that the "true" branch is -;; eliminated. - -;; Also ensure that any unfoldable objectsize is resolved in order. - -;; CHECK-NOT: tail call i32 @subfun_1() -;; CHECK: tail call i32 @subfun_2() -;; CHECK-NOT: tail call i32 @subfun_1() - -declare i1 @llvm.is.constant.i32(i32 %a) nounwind readnone -declare i1 @llvm.is.constant.i64(i64 %a) nounwind readnone -declare i1 @llvm.is.constant.i256(i256 %a) nounwind readnone -declare i1 @llvm.is.constant.v2i64(<2 x i64> %a) nounwind readnone -declare i1 @llvm.is.constant.f32(float %a) nounwind readnone -declare i1 @llvm.is.constant.sl_i32i32s({i32, i32} %a) nounwind readnone -declare i1 @llvm.is.constant.a2i64([2 x i64] %a) nounwind readnone -declare i1 @llvm.is.constant.p0i64(i64* %a) nounwind readnone - -declare i64 @llvm.objectsize.i64.p0i8(i8*, i1, i1, i1) nounwind readnone - -declare i32 @subfun_1() -declare i32 @subfun_2() - -define i32 @test_branch(i32 %in) nounwind { - %v = call i1 @llvm.is.constant.i32(i32 %in) - br i1 %v, label %True, label %False - -True: - %call1 = tail call i32 @subfun_1() - ret i32 %call1 - -False: - %call2 = tail call i32 @subfun_2() - ret i32 %call2 -} - -;; llvm.objectsize is another tricky case which gets folded to -1 very -;; late in the game. We'd like to ensure that llvm.is.constant of -;; llvm.objectsize is true. -define i1 @test_objectsize(i8* %obj) nounwind { -;; CHECK-LABEL: test_objectsize -;; CHECK-NOT: llvm.objectsize -;; CHECK-NOT: llvm.is.constant -;; CHECK: ret i1 true - %os = call i64 @llvm.objectsize.i64.p0i8(i8* %obj, i1 false, i1 false, i1 false) - %os1 = add i64 %os, 1 - %v = call i1 @llvm.is.constant.i64(i64 %os1) - ret i1 %v -} - -@test_phi_a = dso_local global i32 0, align 4 -declare dso_local i32 @test_phi_b(...) - -; Function Attrs: nounwind uwtable -define dso_local i32 @test_phi() { -entry: - %0 = load i32, i32* @test_phi_a, align 4 - %1 = tail call i1 @llvm.is.constant.i32(i32 %0) - br i1 %1, label %cond.end, label %cond.false - -cond.false: ; preds = %entry - %call = tail call i32 bitcast (i32 (...)* @test_phi_b to i32 ()*)() #3 - %.pre = load i32, i32* @test_phi_a, align 4 - br label %cond.end - -cond.end: ; preds = %entry, %cond.false - %2 = phi i32 [ %.pre, %cond.false ], [ %0, %entry ] - %cond = phi i32 [ %call, %cond.false ], [ 1, %entry ] - %cmp = icmp eq i32 %cond, %2 - br i1 %cmp, label %cond.true1, label %cond.end4 - -cond.true1: ; preds = %cond.end - %call2 = tail call i32 bitcast (i32 (...)* @test_phi_b to i32 ()*)() #3 - br label %cond.end4 - -cond.end4: ; preds = %cond.end, %cond.true1 - ret i32 undef -} - -define i1 @test_various_types(i256 %int, float %float, <2 x i64> %vec, {i32, i32} %struct, [2 x i64] %arr, i64* %ptr) #0 { -; CHECK-LABEL: @test_various_types( -; CHECK-NOT: llvm.is.constant - %v1 = call i1 @llvm.is.constant.i256(i256 %int) - %v2 = call i1 @llvm.is.constant.f32(float %float) - %v3 = call i1 @llvm.is.constant.v2i64(<2 x i64> %vec) - %v4 = call i1 @llvm.is.constant.sl_i32i32s({i32, i32} %struct) - %v5 = call i1 @llvm.is.constant.a2i64([2 x i64] %arr) - %v6 = call i1 @llvm.is.constant.p0i64(i64* %ptr) - - %c1 = call i1 @llvm.is.constant.i256(i256 -1) - %c2 = call i1 @llvm.is.constant.f32(float 17.0) - %c3 = call i1 @llvm.is.constant.v2i64(<2 x i64> <i64 -1, i64 44>) - %c4 = call i1 @llvm.is.constant.sl_i32i32s({i32, i32} {i32 -1, i32 32}) - %c5 = call i1 @llvm.is.constant.a2i64([2 x i64] [i64 -1, i64 32]) - %c6 = call i1 @llvm.is.constant.p0i64(i64* inttoptr (i32 42 to i64*)) - - %x1 = add i1 %v1, %c1 - %x2 = add i1 %v2, %c2 - %x3 = add i1 %v3, %c3 - %x4 = add i1 %v4, %c4 - %x5 = add i1 %v5, %c5 - %x6 = add i1 %v6, %c6 - - %res2 = add i1 %x1, %x2 - %res3 = add i1 %res2, %x3 - %res4 = add i1 %res3, %x4 - %res5 = add i1 %res4, %x5 - %res6 = add i1 %res5, %x6 - - ret i1 %res6 -} |