summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author: Chris Lattner <sabre@nondot.org> 2008-04-10 05:13:43 +0000
committer: Chris Lattner <sabre@nondot.org> 2008-04-10 05:13:43 +0000
commit: ad75302497abefa4456db252eeed56faebd54730 (patch)
tree: 85e815f0eb97427380cd0a623d9285d643df05f0
parent: 57dd77462bf3fd40b0880457bedefd41ba29d251 (diff)
download: bcm5719-llvm-ad75302497abefa4456db252eeed56faebd54730.tar.gz
bcm5719-llvm-ad75302497abefa4456db252eeed56faebd54730.zip
Fix the x86-64 side of PR2108 by adding a v2f64 version of
MOVZQI2PQIrr. This would be better handled as a dag combine (with the goal of eliminating the bitconvert) but I don't know how to do that safely. Thoughts welcome.

llvm-svn: 49463
-rw-r--r-- llvm/lib/Target/X86/X86InstrSSE.td 10
-rw-r--r-- llvm/test/CodeGen/X86/vec_shuffle-17.ll 13
2 files changed, 23 insertions, 0 deletions
diff --git a/llvm/lib/Target/X86/X86InstrSSE.td b/llvm/lib/Target/X86/X86InstrSSE.td
index dbc04b01e20..442847cda8e 100644
--- a/llvm/lib/Target/X86/X86InstrSSE.td
+++ b/llvm/lib/Target/X86/X86InstrSSE.td
@@ -2305,6 +2305,16 @@ def MOVZQI2PQIrr : RPDI<0x6E, MRMSrcReg, (outs VR128:$dst), (ins GR64:$src),
MOVL_shuffle_mask)))]>;
}
+// Handle the v2f64 form of 'MOVZQI2PQIrr' for PR2108. FIXME: this would be
+// better written as a dag combine xform.
+let AddedComplexity = 15 in
+def : Pat<(v2f64 (vector_shuffle immAllZerosV_bc,
+ (v2f64 (scalar_to_vector
+ (f64 (bitconvert GR64:$src)))),
+ MOVL_shuffle_mask)),
+ (MOVZQI2PQIrr GR64:$src)>, Requires<[HasSSE3]>;
+
+
let AddedComplexity = 20 in {
def MOVZDI2PDIrm : PDI<0x6E, MRMSrcMem, (outs VR128:$dst), (ins i32mem:$src),
"movd\t{$src, $dst|$dst, $src}",
diff --git a/llvm/test/CodeGen/X86/vec_shuffle-17.ll b/llvm/test/CodeGen/X86/vec_shuffle-17.ll
new file mode 100644
index 00000000000..992d79184b8
--- /dev/null
+++ b/llvm/test/CodeGen/X86/vec_shuffle-17.ll
@@ -0,0 +1,13 @@
+; RUN: llvm-as < %s | llc -march=x86-64 | grep {movd.*%rdi, %xmm0}
+; RUN: llvm-as < %s | llc -march=x86-64 | not grep xor
+; PR2108
+
+define <2 x i64> @doload64(i64 %x) nounwind {
+entry:
+ %tmp717 = bitcast i64 %x to double ; <double> [#uses=1]
+ %tmp8 = insertelement <2 x double> undef, double %tmp717, i32 0 ; <<2 x double>> [#uses=1]
+ %tmp9 = insertelement <2 x double> %tmp8, double 0.000000e+00, i32 1 ; <<2 x double>> [#uses=1]
+ %tmp11 = bitcast <2 x double> %tmp9 to <2 x i64> ; <<2 x i64>> [#uses=1]
+ ret <2 x i64> %tmp11
+}
+
OpenPOWER on IntegriCloud