diff options
author | QingShan Zhang <qshanz@cn.ibm.com> | 2018-09-07 07:56:05 +0000 |
---|---|---|
committer | QingShan Zhang <qshanz@cn.ibm.com> | 2018-09-07 07:56:05 +0000 |
commit | abbb894ff58cff160f81954d794d009c3cb92eb9 (patch) | |
tree | 54b3d22f3eaaabc253c5a786e0a828cec9c9011f /llvm/test/CodeGen/PowerPC | |
parent | 9e6845d8e12e4dba18e62a04a7980860eb3f46d2 (diff) | |
download | bcm5719-llvm-abbb894ff58cff160f81954d794d009c3cb92eb9.tar.gz bcm5719-llvm-abbb894ff58cff160f81954d794d009c3cb92eb9.zip |
[PowerPC] Combine ADD to ADDZE
On the ppc64le platform, if ir has the following form,
define i64 @addze1(i64 %x, i64 %z) local_unnamed_addr #0 {
entry:
%cmp = icmp ne i64 %z, CONSTANT (-32767 <= CONSTANT <= 32768)
%conv1 = zext i1 %cmp to i64
%add = add nsw i64 %conv1, %x
ret i64 %add
}
we can optimize it to the form below.
when C == 0
--> addze X, (addic Z, -1))
/
add X, (zext(setne Z, C))--
\ when -32768 <= -C <= 32767 && C != 0
--> addze X, (addic (addi Z, -C), -1)
Patch By: HLJ2009 (Li Jia He)
Differential Revision: https://reviews.llvm.org/D51403
Reviewed By: Nemanjai
llvm-svn: 341634
Diffstat (limited to 'llvm/test/CodeGen/PowerPC')
-rw-r--r-- | llvm/test/CodeGen/PowerPC/addze.ll | 172 |
1 files changed, 172 insertions, 0 deletions
diff --git a/llvm/test/CodeGen/PowerPC/addze.ll b/llvm/test/CodeGen/PowerPC/addze.ll new file mode 100644 index 00000000000..212da8b4990 --- /dev/null +++ b/llvm/test/CodeGen/PowerPC/addze.ll @@ -0,0 +1,172 @@ +; RUN: llc -verify-machineinstrs -mtriple=powerpc64-unknown-unknown \ +; RUN: -ppc-asm-full-reg-names -mcpu=pwr9 < %s | FileCheck %s +; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-unknown \ +; RUN: -ppc-asm-full-reg-names -mcpu=pwr9 < %s | FileCheck %s + +define i64 @addze1(i64 %X, i64 %Z) { +; CHECK-LABEL: addze1: +; CHECK: # %bb.0: +; CHECK-NEXT: addic [[REG1:r[0-9]+]], [[REG1]], -1 +; CHECK-NEXT: addze [[REG2:r[0-9]+]], [[REG2]] +; CHECK-NEXT: blr + %cmp = icmp ne i64 %Z, 0 + %conv1 = zext i1 %cmp to i64 + %add = add nsw i64 %conv1, %X + ret i64 %add +} + +define i64 @addze2(i64 %X, i64 %Z) { +; CHECK-LABEL: addze2: +; CHECK: # %bb.0: +; CHECK-NEXT: subfic [[REG1:r[0-9]+]], [[REG1]], 0 +; CHECK-NEXT: addze [[REG2:r[0-9]+]], [[REG2]] +; CHECK-NEXT: blr + %cmp = icmp eq i64 %Z, 0 + %conv1 = zext i1 %cmp to i64 + %add = add nsw i64 %conv1, %X + ret i64 %add +} + +define i64 @addze3(i64 %X, i64 %Z) { +; CHECK-LABEL: addze3: +; CHECK: # %bb.0: +; CHECK-NEXT: addi [[REG1:r[0-9]+]], [[REG1]], -32768 +; CHECK-NEXT: addic [[REG1]], [[REG1]], -1 +; CHECK-NEXT: addze [[REG2:r[0-9]+]], [[REG2]] +; CHECK-NEXT: blr + %cmp = icmp ne i64 %Z, 32768 + %conv1 = zext i1 %cmp to i64 + %add = add nsw i64 %conv1, %X + ret i64 %add +} + +define i64 @addze4(i64 %X, i64 %Z) { +; CHECK-LABEL: addze4: +; CHECK: # %bb.0: +; CHECK-NEXT: addi [[REG1:r[0-9]+]], [[REG1]], -32768 +; CHECK-NEXT: subfic [[REG1]], [[REG1]], 0 +; CHECK-NEXT: addze [[REG2:r[0-9]+]], [[REG2]] +; CHECK-NEXT: blr + %cmp = icmp eq i64 %Z, 32768 + %conv1 = zext i1 %cmp to i64 + %add = add nsw i64 %conv1, %X + ret i64 %add +} + +define i64 @addze5(i64 %X, i64 %Z) { +; CHECK-LABEL: addze5: +; CHECK: # %bb.0: +; CHECK-NEXT: addi [[REG1:r[0-9]+]], [[REG1]], 32767 +; CHECK-NEXT: addic [[REG1]], [[REG1]], -1 +; CHECK-NEXT: addze [[REG2:r[0-9]+]], [[REG2]] +; CHECK-NEXT: blr + %cmp = icmp ne i64 %Z, -32767 + %conv1 = zext i1 %cmp to i64 + %add = add nsw i64 %conv1, %X + ret i64 %add +} + +define i64 @addze6(i64 %X, i64 %Z) { +; CHECK-LABEL: addze6: +; CHECK: # %bb.0: +; CHECK-NEXT: addi [[REG1:r[0-9]+]], [[REG1]], 32767 +; CHECK-NEXT: subfic [[REG1]], [[REG1]], 0 +; CHECK-NEXT: addze [[REG2:r[0-9]+]], [[REG2]] +; CHECK-NEXT: blr + %cmp = icmp eq i64 %Z, -32767 + %conv1 = zext i1 %cmp to i64 + %add = add nsw i64 %conv1, %X + ret i64 %add +} + +; element is out of range +define i64 @test1(i64 %X, i64 %Z) { +; CHECK-LABEL: test1: +; CHECK: # %bb.0: +; CHECK-NEXT: li [[REG1:r[0-9]+]], -32768 +; CHECK-NEXT: xor [[REG2:r[0-9]+]], [[REG2]], [[REG1]] +; CHECK-NEXT: addic [[REG1]], [[REG2]], -1 +; CHECK-NEXT: subfe [[REG2]], [[REG1]], [[REG2]] +; CHECK-NEXT: add [[REG3:r[0-9]+]], [[REG2]], [[REG3]] +; CHECK-NEXT: blr + %cmp = icmp ne i64 %Z, -32768 + %conv1 = zext i1 %cmp to i64 + %add = add nsw i64 %conv1, %X + ret i64 %add +} + +define i64 @test2(i64 %X, i64 %Z) { +; CHECK-LABEL: test2: +; CHECK: # %bb.0: +; CHECK-NEXT: li [[REG1:r[0-9]+]], -32768 +; CHECK-NEXT: xor [[REG2:r[0-9]+]], [[REG2]], [[REG1]] +; CHECK-NEXT: cntlzd [[REG2]], [[REG2]] +; CHECK-NEXT: rldicl [[REG2]], [[REG2]], 58, 63 +; CHECK-NEXT: add [[REG3:r[0-9]+]], [[REG2]], [[REG3]] +; CHECK-NEXT: blr + %cmp = icmp eq i64 %Z, -32768 + %conv1 = zext i1 %cmp to i64 + %add = add nsw i64 %conv1, %X + ret i64 %add +} + +define i64 @test3(i64 %X, i64 %Z) { +; CHECK-LABEL: test3: +; CHECK: # %bb.0: +; CHECK-NEXT: li [[REG1:r[0-9]+]], 0 +; CHECK-NEXT: ori [[REG1]], [[REG1]], 32769 +; CHECK-NEXT: xor [[REG2:r[0-9]+]], [[REG2]], [[REG1]] +; CHECK-NEXT: addic [[REG1]], [[REG2]], -1 +; CHECK-NEXT: subfe [[REG2]], [[REG1]], [[REG2]] +; CHECK-NEXT: add [[REG3:r[0-9]+]], [[REG2]], [[REG3]] +; CHECK-NEXT: blr + %cmp = icmp ne i64 %Z, 32769 + %conv1 = zext i1 %cmp to i64 + %add = add nsw i64 %conv1, %X + ret i64 %add +} + +define i64 @test4(i64 %X, i64 %Z) { +; CHECK-LABEL: test4: +; CHECK: # %bb.0: +; CHECK-NEXT: li [[REG1:r[0-9]+]], 0 +; CHECK-NEXT: ori [[REG1]], [[REG1]], 32769 +; CHECK-NEXT: xor [[REG2:r[0-9]+]], [[REG2]], [[REG1]] +; CHECK-NEXT: cntlzd [[REG2]], [[REG2]] +; CHECK-NEXT: rldicl [[REG2]], [[REG2]], 58, 63 +; CHECK-NEXT: add [[REG3:r[0-9]+]], [[REG2]], [[REG3]] +; CHECK-NEXT: blr + %cmp = icmp eq i64 %Z, 32769 + %conv1 = zext i1 %cmp to i64 + %add = add nsw i64 %conv1, %X + ret i64 %add +} + +; comparison of two registers +define i64 @test5(i64 %X, i64 %Y, i64 %Z) { +; CHECK-LABEL: test5: +; CHECK: # %bb.0: +; CHECK-NEXT: xor [[REG2:r[0-9]+]], [[REG2]], [[REG1:r[0-9]+]] +; CHECK-NEXT: addic [[REG1]], [[REG2]], -1 +; CHECK-NEXT: subfe [[REG2]], [[REG1]], [[REG2]] +; CHECK-NEXT: add [[REG3:r[0-9]+]], [[REG2]], [[REG3]] +; CHECK-NEXT: blr + %cmp = icmp ne i64 %Y, %Z + %conv1 = zext i1 %cmp to i64 + %add = add nsw i64 %conv1, %X + ret i64 %add +} + +define i64 @test6(i64 %X, i64 %Y, i64 %Z) { +; CHECK-LABEL: test6: +; CHECK: # %bb.0: +; CHECK-NEXT: xor [[REG2:r[0-9]+]], [[REG2]], [[REG1:r[0-9]+]] +; CHECK-NEXT: cntlzd [[REG2]], [[REG2]] +; CHECK-NEXT: rldicl [[REG2]], [[REG2]], 58, 63 +; CHECK-NEXT: add [[REG3:r[0-9]+]], [[REG2]], [[REG3]] +; CHECK-NEXT: blr + %cmp = icmp eq i64 %Y, %Z + %conv1 = zext i1 %cmp to i64 + %add = add nsw i64 %conv1, %X + ret i64 %add +} |