diff options
author | Andrea Di Biagio <Andrea_DiBiagio@sn.scee.net> | 2015-01-06 17:41:18 +0000 |
---|---|---|
committer | Andrea Di Biagio <Andrea_DiBiagio@sn.scee.net> | 2015-01-06 17:41:18 +0000 |
commit | f807a6f2970398b85ccd2a3ba6d8959426a9872f (patch) | |
tree | 911eb76a03413e1686ee193038b3d84907aef6a6 /llvm/test/CodeGen/X86/cttz-ctlz.ll | |
parent | a76dfbd4288271d3a61fe2f4307c406780ce7c49 (diff) | |
download | bcm5719-llvm-f807a6f2970398b85ccd2a3ba6d8959426a9872f.tar.gz bcm5719-llvm-f807a6f2970398b85ccd2a3ba6d8959426a9872f.zip |
[CodeGenPrepare] Improved logic to speculate calls to cttz/ctlz.
This patch improves the logic added at revision 224899 (see review D6728) that
teaches the backend when it is profitable to speculate calls to cttz/ctlz.
The original algorithm conservatively avoided speculating more than one
instruction from a basic block in a control flow graph modelling an if-statement.
In particular, the only allowed instruction (excluding the terminator) was a
call to cttz/ctlz. However, there are cases where we could be less conservative
and still be able to speculate a call to cttz/ctlz.
With this patch, CodeGenPrepare now tries to speculate a cttz/ctlz if the
result is zero extended/truncated in the same basic block, and the zext/trunc
instruction is "free" for the target.
Added new test cases to CodeGen/X86/cttz-ctlz.ll
Differential Revision: http://reviews.llvm.org/D6853
llvm-svn: 225274
Diffstat (limited to 'llvm/test/CodeGen/X86/cttz-ctlz.ll')
-rw-r--r-- | llvm/test/CodeGen/X86/cttz-ctlz.ll | 172 |
1 files changed, 172 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/X86/cttz-ctlz.ll b/llvm/test/CodeGen/X86/cttz-ctlz.ll index 88dcf650a21..8717d401595 100644 --- a/llvm/test/CodeGen/X86/cttz-ctlz.ll +++ b/llvm/test/CodeGen/X86/cttz-ctlz.ll @@ -241,6 +241,178 @@ cond.end: ; preds = %entry, %cond.true ret i16 %cond } +; The following tests verify that calls to cttz/ctlz are speculated even if +; basic block %cond.true has an extra zero extend/truncate which is "free" +; for the target. + +define i64 @test1e(i32 %x) { +; ALL-LABEL: @test1e( +; LZCNT: icmp eq i32 %x, 0 +; LZCNT: call i32 @llvm.cttz.i32(i32 %x, i1 true) +; BMI: call i32 @llvm.cttz.i32(i32 %x, i1 false) +; GENERIC: icmp eq i32 %x, 0 +; GENERIC: call i32 @llvm.cttz.i32(i32 %x, i1 true) +entry: + %tobool = icmp eq i32 %x, 0 + br i1 %tobool, label %cond.end, label %cond.true + +cond.true: ; preds = %entry + %0 = tail call i32 @llvm.cttz.i32(i32 %x, i1 true) + %phitmp2 = zext i32 %0 to i64 + br label %cond.end + +cond.end: ; preds = %entry, %cond.true + %cond = phi i64 [ %phitmp2, %cond.true ], [ 32, %entry ] + ret i64 %cond +} + +define i32 @test2e(i64 %x) { +; ALL-LABEL: @test2e( +; LZCNT: icmp eq i64 %x, 0 +; LZCNT: call i64 @llvm.cttz.i64(i64 %x, i1 true) +; BMI: call i64 @llvm.cttz.i64(i64 %x, i1 false) +; GENERIC: icmp eq i64 %x, 0 +; GENERIC: call i64 @llvm.cttz.i64(i64 %x, i1 true) +entry: + %tobool = icmp eq i64 %x, 0 + br i1 %tobool, label %cond.end, label %cond.true + +cond.true: ; preds = %entry + %0 = tail call i64 @llvm.cttz.i64(i64 %x, i1 true) + %cast = trunc i64 %0 to i32 + br label %cond.end + +cond.end: ; preds = %entry, %cond.true + %cond = phi i32 [ %cast, %cond.true ], [ 64, %entry ] + ret i32 %cond +} + +define i64 @test3e(i32 %x) { +; ALL-LABEL: @test3e( +; BMI: icmp eq i32 %x, 0 +; BMI: call i32 @llvm.ctlz.i32(i32 %x, i1 true) +; LZCNT: call i32 @llvm.ctlz.i32(i32 %x, i1 false) +; GENERIC: icmp eq i32 %x, 0 +; GENERIC: call i32 @llvm.ctlz.i32(i32 %x, i1 true) +entry: + %tobool = icmp eq i32 %x, 0 + br i1 %tobool, 
label %cond.end, label %cond.true + +cond.true: ; preds = %entry + %0 = tail call i32 @llvm.ctlz.i32(i32 %x, i1 true) + %phitmp2 = zext i32 %0 to i64 + br label %cond.end + +cond.end: ; preds = %entry, %cond.true + %cond = phi i64 [ %phitmp2, %cond.true ], [ 32, %entry ] + ret i64 %cond +} + +define i32 @test4e(i64 %x) { +; ALL-LABEL: @test4e( +; BMI: icmp eq i64 %x, 0 +; BMI: call i64 @llvm.ctlz.i64(i64 %x, i1 true) +; LZCNT: call i64 @llvm.ctlz.i64(i64 %x, i1 false) +; GENERIC: icmp eq i64 %x, 0 +; GENERIC: call i64 @llvm.ctlz.i64(i64 %x, i1 true) +entry: + %tobool = icmp eq i64 %x, 0 + br i1 %tobool, label %cond.end, label %cond.true + +cond.true: ; preds = %entry + %0 = tail call i64 @llvm.ctlz.i64(i64 %x, i1 true) + %cast = trunc i64 %0 to i32 + br label %cond.end + +cond.end: ; preds = %entry, %cond.true + %cond = phi i32 [ %cast, %cond.true ], [ 64, %entry ] + ret i32 %cond +} + +define i16 @test5e(i64 %x) { +; ALL-LABEL: @test5e( +; BMI: icmp eq i64 %x, 0 +; BMI: call i64 @llvm.ctlz.i64(i64 %x, i1 true) +; LZCNT: call i64 @llvm.ctlz.i64(i64 %x, i1 false) +; GENERIC: icmp eq i64 %x, 0 +; GENERIC: call i64 @llvm.ctlz.i64(i64 %x, i1 true) +entry: + %tobool = icmp eq i64 %x, 0 + br i1 %tobool, label %cond.end, label %cond.true + +cond.true: ; preds = %entry + %0 = tail call i64 @llvm.ctlz.i64(i64 %x, i1 true) + %cast = trunc i64 %0 to i16 + br label %cond.end + +cond.end: ; preds = %entry, %cond.true + %cond = phi i16 [ %cast, %cond.true ], [ 64, %entry ] + ret i16 %cond +} + +define i16 @test6e(i32 %x) { +; ALL-LABEL: @test6e( +; BMI: icmp eq i32 %x, 0 +; BMI: call i32 @llvm.ctlz.i32(i32 %x, i1 true) +; LZCNT: call i32 @llvm.ctlz.i32(i32 %x, i1 false) +; GENERIC: icmp eq i32 %x, 0 +; GENERIC: call i32 @llvm.ctlz.i32(i32 %x, i1 true) +entry: + %tobool = icmp eq i32 %x, 0 + br i1 %tobool, label %cond.end, label %cond.true + +cond.true: ; preds = %entry + %0 = tail call i32 @llvm.ctlz.i32(i32 %x, i1 true) + %cast = trunc i32 %0 to i16 + br label %cond.end + 
+cond.end: ; preds = %entry, %cond.true + %cond = phi i16 [ %cast, %cond.true ], [ 32, %entry ] + ret i16 %cond +} + +define i16 @test7e(i64 %x) { +; ALL-LABEL: @test7e( +; LZCNT: icmp eq i64 %x, 0 +; LZCNT: call i64 @llvm.cttz.i64(i64 %x, i1 true) +; BMI: call i64 @llvm.cttz.i64(i64 %x, i1 false) +; GENERIC: icmp eq i64 %x, 0 +; GENERIC: call i64 @llvm.cttz.i64(i64 %x, i1 true) +entry: + %tobool = icmp eq i64 %x, 0 + br i1 %tobool, label %cond.end, label %cond.true + +cond.true: ; preds = %entry + %0 = tail call i64 @llvm.cttz.i64(i64 %x, i1 true) + %cast = trunc i64 %0 to i16 + br label %cond.end + +cond.end: ; preds = %entry, %cond.true + %cond = phi i16 [ %cast, %cond.true ], [ 64, %entry ] + ret i16 %cond +} + +define i16 @test8e(i32 %x) { +; ALL-LABEL: @test8e( +; LZCNT: icmp eq i32 %x, 0 +; LZCNT: call i32 @llvm.cttz.i32(i32 %x, i1 true) +; BMI: call i32 @llvm.cttz.i32(i32 %x, i1 false) +; GENERIC: icmp eq i32 %x, 0 +; GENERIC: call i32 @llvm.cttz.i32(i32 %x, i1 true) +entry: + %tobool = icmp eq i32 %x, 0 + br i1 %tobool, label %cond.end, label %cond.true + +cond.true: ; preds = %entry + %0 = tail call i32 @llvm.cttz.i32(i32 %x, i1 true) + %cast = trunc i32 %0 to i16 + br label %cond.end + +cond.end: ; preds = %entry, %cond.true + %cond = phi i16 [ %cast, %cond.true ], [ 32, %entry ] + ret i16 %cond +} + declare i64 @llvm.ctlz.i64(i64, i1) declare i32 @llvm.ctlz.i32(i32, i1) |