aboutsummaryrefslogtreecommitdiffstats
path: root/test/CodeGen/X86/opt-shuff-tstore.ll
diff options
context:
space:
mode:
author: Nadav Rotem <nadav.rotem@intel.com> 2011-08-10 19:30:14 +0000
committer: Nadav Rotem <nadav.rotem@intel.com> 2011-08-10 19:30:14 +0000
commit: 614061bfb4fea3c1233ecf2676282e063724ae93 (patch)
tree: 39b076801d61771df2fc6bd98eb4c2f281c924e5 /test/CodeGen/X86/opt-shuff-tstore.ll
parent: 103b8e653c981fe916b855f1b96cb35e01c4543e (diff)
download: external_llvm-614061bfb4fea3c1233ecf2676282e063724ae93.zip
external_llvm-614061bfb4fea3c1233ecf2676282e063724ae93.tar.gz
external_llvm-614061bfb4fea3c1233ecf2676282e063724ae93.tar.bz2
When performing a truncating store, it is sometimes possible to rearrange the
data in-register prior to saving to memory. Reordering the data in-register first avoids the need to save multiple scalars to memory, so a single regular store can be used instead.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@137238 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'test/CodeGen/X86/opt-shuff-tstore.ll')
-rw-r--r-- test/CodeGen/X86/opt-shuff-tstore.ll | 39
1 files changed, 39 insertions, 0 deletions
diff --git a/test/CodeGen/X86/opt-shuff-tstore.ll b/test/CodeGen/X86/opt-shuff-tstore.ll
new file mode 100644
index 0000000..4596068
--- /dev/null
+++ b/test/CodeGen/X86/opt-shuff-tstore.ll
@@ -0,0 +1,39 @@
+; RUN: llc -mcpu=corei7 < %s -o - -promote-elements -mattr=+sse2,+sse41 | FileCheck %s
+
+; CHECK: func_4_8
+; A single memory write: the <4 x i8> result (32 bits in total) is expected to be stored by one movd, immediately followed by ret.
+; CHECK: movd
+; CHECK-NEXT: ret
+define void @func_4_8(<4 x i8> %param, <4 x i8>* %p) {
+ %r = add <4 x i8> %param, <i8 1, i8 2, i8 3, i8 4> ; element-wise add of a constant vector to the argument
+ store <4 x i8> %r, <4 x i8>* %p ; the vector store whose lowering is being tested
+ ret void
+}
+
+; CHECK: func_4_16
+; CHECK: movq
+; CHECK-NEXT: ret
+define void @func_4_16(<4 x i16> %param, <4 x i16>* %p) { ; <4 x i16> is 64 bits in total; the directives above expect one movq immediately followed by ret
+ %r = add <4 x i16> %param, <i16 1, i16 2, i16 3, i16 4> ; element-wise add of a constant vector to the argument
+ store <4 x i16> %r, <4 x i16>* %p ; the vector store whose lowering is being tested
+ ret void
+}
+
+; CHECK: func_8_8
+; CHECK: movq
+; CHECK-NEXT: ret
+define void @func_8_8(<8 x i8> %param, <8 x i8>* %p) { ; <8 x i8> is 64 bits in total; the directives above expect one movq immediately followed by ret
+ %r = add <8 x i8> %param, <i8 1, i8 2, i8 3, i8 4, i8 1, i8 2, i8 3, i8 4> ; element-wise add of a constant vector to the argument
+ store <8 x i8> %r, <8 x i8>* %p ; the vector store whose lowering is being tested
+ ret void
+}
+
+; CHECK: func_2_32
+; CHECK: movq
+; CHECK-NEXT: ret
+define void @func_2_32(<2 x i32> %param, <2 x i32>* %p) { ; <2 x i32> is 64 bits in total; the directives above expect one movq immediately followed by ret
+ %r = add <2 x i32> %param, <i32 1, i32 2> ; element-wise add of a constant vector to the argument
+ store <2 x i32> %r, <2 x i32>* %p ; the vector store whose lowering is being tested
+ ret void
+}
+