aboutsummaryrefslogtreecommitdiffstats
path: root/test/CodeGen/X86/vec_shuffle-23.ll
diff options
context:
space:
mode:
authorEvan Cheng <evan.cheng@apple.com>2008-09-26 23:41:32 +0000
committerEvan Cheng <evan.cheng@apple.com>2008-09-26 23:41:32 +0000
commitb7a75a5a541a836d07cfc5ccebd70bb5e42f797f (patch)
tree66181d36082ae4203edbca00c97e614e31fc7f3b /test/CodeGen/X86/vec_shuffle-23.ll
parent19c874638d9478a5d5028854817a5ee72293bb2b (diff)
downloadexternal_llvm-b7a75a5a541a836d07cfc5ccebd70bb5e42f797f.zip
external_llvm-b7a75a5a541a836d07cfc5ccebd70bb5e42f797f.tar.gz
external_llvm-b7a75a5a541a836d07cfc5ccebd70bb5e42f797f.tar.bz2
Implement "punpckldq %xmm0, %xmm0" as "pshufd $0x50, %xmm0, %xmm0" unless optimizing for code size.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@56711 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'test/CodeGen/X86/vec_shuffle-23.ll')
-rw-r--r-- test/CodeGen/X86/vec_shuffle-23.ll 19
1 files changed, 19 insertions, 0 deletions
diff --git a/test/CodeGen/X86/vec_shuffle-23.ll b/test/CodeGen/X86/vec_shuffle-23.ll
new file mode 100644
index 0000000..34d84ef
--- /dev/null
+++ b/test/CodeGen/X86/vec_shuffle-23.ll
@@ -0,0 +1,19 @@
+; RUN: llvm-as < %s | llc -march=x86 -mattr=+sse2 | not grep punpck
+; RUN: llvm-as < %s | llc -march=x86 -mattr=+sse2 | grep pshufd
+; RUN: llvm-as < %s | llc -march=x86 -mattr=+sse2 -optimize-size | grep punpck
+
+define i32 @t() nounwind { ; test body: builds a self-interleaving shuffle of one <4 x i32> and returns lane 0 of the result
+entry:
+ %a = alloca <4 x i32> ; <<4 x i32>*> [#uses=2]
+ %b = alloca <4 x i32> ; <<4 x i32>*> [#uses=5]
+ volatile store <4 x i32> < i32 0, i32 1, i32 2, i32 3 >, <4 x i32>* %a ; seed %a with <0,1,2,3>; NOTE(review): volatile presumably keeps the constant from being folded away - confirm
+ %tmp = load <4 x i32>* %a ; <<4 x i32>> [#uses=1]
+ store <4 x i32> %tmp, <4 x i32>* %b ; copy the vector read from %a into %b
+ %tmp1 = load <4 x i32>* %b ; <<4 x i32>> [#uses=1]
+ %tmp2 = load <4 x i32>* %b ; <<4 x i32>> [#uses=1] -- second read of the same slot; no store to %b since %tmp1
+ %punpckldq = shufflevector <4 x i32> %tmp1, <4 x i32> %tmp2, <4 x i32> < i32 0, i32 4, i32 1, i32 5 > ; <<4 x i32>> [#uses=1] -- mask 0,4,1,5 interleaves lanes 0 and 1 of %tmp1 with lanes 0 and 1 of %tmp2; this is the shuffle the RUN lines check the lowering of
+ store <4 x i32> %punpckldq, <4 x i32>* %b ; write the shuffled vector back to %b
+ %tmp3 = load <4 x i32>* %b ; <<4 x i32>> [#uses=1]
+ %result = extractelement <4 x i32> %tmp3, i32 0 ; <i32> [#uses=1]
+ ret i32 %result
+}