diff options
| author | Evan Cheng <evan.cheng@apple.com> | 2009-01-27 03:30:42 +0000 |
|---|---|---|
| committer | Evan Cheng <evan.cheng@apple.com> | 2009-01-27 03:30:42 +0000 |
| commit | 1bc8af207ef075bea5dce5fd98ec45918a8dcad6 (patch) | |
| tree | 6ee9cc17b4a691fc30bb7fbc72e794274d92edcc /llvm | |
| parent | ce95cddd0fddee773e7b8311573ac20fecbd0589 (diff) | |
| download | bcm5719-llvm-1bc8af207ef075bea5dce5fd98ec45918a8dcad6.tar.gz bcm5719-llvm-1bc8af207ef075bea5dce5fd98ec45918a8dcad6.zip | |
Implement multiply with overflow by 2 with an add instruction.
llvm-svn: 63090
Diffstat (limited to 'llvm')
| -rw-r--r-- | llvm/lib/Target/X86/X86InstrInfo.td | 11 | ||||
| -rw-r--r-- | llvm/test/CodeGen/X86/smul-with-overflow-2.ll | 20 |
2 files changed, 31 insertions, 0 deletions
diff --git a/llvm/lib/Target/X86/X86InstrInfo.td b/llvm/lib/Target/X86/X86InstrInfo.td index 9649c234de4..f4a57be007e 100644 --- a/llvm/lib/Target/X86/X86InstrInfo.td +++ b/llvm/lib/Target/X86/X86InstrInfo.td @@ -3612,6 +3612,17 @@ def : Pat<(parallel (X86smul_ovf (load addr:$src1), i32immSExt8:$src2), (implicit EFLAGS)), (IMUL32rmi8 addr:$src1, i32immSExt8:$src2)>; +// Optimize multiple with overflow by 2. +let AddedComplexity = 2 in { +def : Pat<(parallel (X86smul_ovf GR16:$src1, 2), + (implicit EFLAGS)), + (ADD16rr GR16:$src1, GR16:$src1)>; + +def : Pat<(parallel (X86smul_ovf GR32:$src1, 2), + (implicit EFLAGS)), + (ADD32rr GR32:$src1, GR32:$src1)>; +} + //===----------------------------------------------------------------------===// // Floating Point Stack Support //===----------------------------------------------------------------------===// diff --git a/llvm/test/CodeGen/X86/smul-with-overflow-2.ll b/llvm/test/CodeGen/X86/smul-with-overflow-2.ll new file mode 100644 index 00000000000..c3dbfd796f2 --- /dev/null +++ b/llvm/test/CodeGen/X86/smul-with-overflow-2.ll @@ -0,0 +1,20 @@ +; RUN: llvm-as < %s | llc -march=x86 | grep mul | count 1 +; RUN: llvm-as < %s | llc -march=x86 | grep add | count 3 + +define i32 @t1(i32 %a, i32 %b) nounwind readnone { +entry: + %tmp0 = add i32 %b, %a + %tmp1 = call { i32, i1 } @llvm.smul.with.overflow.i32(i32 %tmp0, i32 2) + %tmp2 = extractvalue { i32, i1 } %tmp1, 0 + ret i32 %tmp2 +} + +define i32 @t2(i32 %a, i32 %b) nounwind readnone { +entry: + %tmp0 = add i32 %b, %a + %tmp1 = call { i32, i1 } @llvm.smul.with.overflow.i32(i32 %tmp0, i32 4) + %tmp2 = extractvalue { i32, i1 } %tmp1, 0 + ret i32 %tmp2 +} + +declare { i32, i1 } @llvm.smul.with.overflow.i32(i32, i32) nounwind |

