about summary refs log tree commit diff stats
diff options
context:
space:
mode:
author Chris Lattner <sabre@nondot.org> 2008-04-10 05:13:43 +0000
committer Chris Lattner <sabre@nondot.org> 2008-04-10 05:13:43 +0000
commit db66750753de3f6da8b4a3728dcbebb551f1328e (patch)
tree 4a745fcf128def111ba4157cfd3c622741c33022
parent 3dc2e96eec566f8c4e88a34296d6f10b840d7d1e (diff)
download external_llvm-db66750753de3f6da8b4a3728dcbebb551f1328e.zip
external_llvm-db66750753de3f6da8b4a3728dcbebb551f1328e.tar.gz
external_llvm-db66750753de3f6da8b4a3728dcbebb551f1328e.tar.bz2
Fix the x86-64 side of PR2108 by adding a v2f64 version of
MOVZQI2PQIrr. This would be better handled as a dag combine (with the
goal of eliminating the bitconvert) but I don't know how to do that
safely. Thoughts welcome.

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@49463 91177308-0d34-0410-b5e6-96231b3b80d8
-rw-r--r-- lib/Target/X86/X86InstrSSE.td 10
-rw-r--r-- test/CodeGen/X86/vec_shuffle-17.ll 13
2 files changed, 23 insertions, 0 deletions
diff --git a/lib/Target/X86/X86InstrSSE.td b/lib/Target/X86/X86InstrSSE.td
index dbc04b0..442847c 100644
--- a/lib/Target/X86/X86InstrSSE.td
+++ b/lib/Target/X86/X86InstrSSE.td
@@ -2305,6 +2305,16 @@ def MOVZQI2PQIrr : RPDI<0x6E, MRMSrcReg, (outs VR128:$dst), (ins GR64:$src),
MOVL_shuffle_mask)))]>;
}
+// Handle the v2f64 form of 'MOVZQI2PQIrr' for PR2108. FIXME: this would be
+// better written as a dag combine xform.
+let AddedComplexity = 15 in
+def : Pat<(v2f64 (vector_shuffle immAllZerosV_bc,
+ (v2f64 (scalar_to_vector
+ (f64 (bitconvert GR64:$src)))),
+ MOVL_shuffle_mask)),
+ (MOVZQI2PQIrr GR64:$src)>, Requires<[HasSSE3]>;
+
+
let AddedComplexity = 20 in {
def MOVZDI2PDIrm : PDI<0x6E, MRMSrcMem, (outs VR128:$dst), (ins i32mem:$src),
"movd\t{$src, $dst|$dst, $src}",
diff --git a/test/CodeGen/X86/vec_shuffle-17.ll b/test/CodeGen/X86/vec_shuffle-17.ll
new file mode 100644
index 0000000..992d791
--- /dev/null
+++ b/test/CodeGen/X86/vec_shuffle-17.ll
@@ -0,0 +1,13 @@
+; RUN: llvm-as < %s | llc -march=x86-64 | grep {movd.*%rdi, %xmm0}
+; RUN: llvm-as < %s | llc -march=x86-64 | not grep xor
+; PR2108
+
+define <2 x i64> @doload64(i64 %x) nounwind {
+entry:
+ %tmp717 = bitcast i64 %x to double ; <double> [#uses=1]
+ %tmp8 = insertelement <2 x double> undef, double %tmp717, i32 0 ; <<2 x double>> [#uses=1]
+ %tmp9 = insertelement <2 x double> %tmp8, double 0.000000e+00, i32 1 ; <<2 x double>> [#uses=1]
+ %tmp11 = bitcast <2 x double> %tmp9 to <2 x i64> ; <<2 x i64>> [#uses=1]
+ ret <2 x i64> %tmp11
+}
+