Modify the code that lowers shuffles to blends from using blendvXX to vblendXX.

blendv uses a register for the selection while vblend uses an immediate. On sandybridge they still have the same latency and execute on the same execution ports. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@154396 91177308-0d34-0410-b5e6-96231b3b80d8
author: Nadav Rotem <nadav.rotem@intel.com> 2012-04-10 14:33:13 +0000
committer: Nadav Rotem <nadav.rotem@intel.com> 2012-04-10 14:33:13 +0000
commit: 50e64cfe6e250dbe2528fc5bda75c68b04a8bc49 (patch)
tree: 11f8711c3c0c8a1418507063bde7ac8b81a7826f /test
parent: 45fb79bc54159330979bf24e4bfbdbb64bee1e2c (diff)
download: external_llvm-50e64cfe6e250dbe2528fc5bda75c68b04a8bc49.zip
external_llvm-50e64cfe6e250dbe2528fc5bda75c68b04a8bc49.tar.gz
external_llvm-50e64cfe6e250dbe2528fc5bda75c68b04a8bc49.tar.bz2
2 files changed, 6 insertions, 6 deletions
diff --git a/test/CodeGen/X86/avx-shuffle.ll b/test/CodeGen/X86/avx-shuffle.ll
index f323f3f..16c447b 100644
--- a/test/CodeGen/X86/avx-shuffle.ll
+++ b/test/CodeGen/X86/avx-shuffle.ll
@@ -164,7 +164,7 @@ i32 2, i32 4, i32 6, i32 8, i32 10, i32 12, i32 14, i32 16, i32 18, i32 20, i32
 }
 
 ; CHECK: blend1
-; CHECK: vblendvps
+; CHECK: vblendps
 ; CHECK: ret
 define <4 x i32> @blend1(<4 x i32> %a, <4 x i32> %b) nounwind alwaysinline {
   %t = shufflevector <4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 0, i32 1, i32 2, i32 7>
@@ -172,7 +172,7 @@ define <4 x i32> @blend1(<4 x i32> %a, <4 x i32> %b) nounwind alwaysinline {
 }
 
 ; CHECK: blend2
-; CHECK: vblendvps
+; CHECK: vblendps
 ; CHECK: ret
 define <4 x i32> @blend2(<4 x i32> %a, <4 x i32> %b) nounwind alwaysinline {
   %t = shufflevector <4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 0, i32 5, i32 2, i32 7>
@@ -180,7 +180,7 @@ define <4 x i32> @blend2(<4 x i32> %a, <4 x i32> %b) nounwind alwaysinline {
 }
 
 ; CHECK: blend2a
-; CHECK: vblendvps
+; CHECK: vblendps
 ; CHECK: ret
 define <4 x float> @blend2a(<4 x float> %a, <4 x float> %b) nounwind alwaysinline {
   %t = shufflevector <4 x float> %a, <4 x float> %b, <4 x i32> <i32 0, i32 5, i32 2, i32 7>
@@ -188,7 +188,7 @@ define <4 x float> @blend2a(<4 x float> %a, <4 x float> %b) nounwind alwaysinlin
 }
 
 ; CHECK: blend3
-; CHECK-NOT: vblendvps
+; CHECK-NOT: vblendps
 ; CHECK: ret
 define <4 x i32> @blend3(<4 x i32> %a, <4 x i32> %b) nounwind alwaysinline {
   %t = shufflevector <4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 1, i32 5, i32 2, i32 7>
@@ -196,7 +196,7 @@ define <4 x i32> @blend3(<4 x i32> %a, <4 x i32> %b) nounwind alwaysinline {
 }
 
 ; CHECK: blend4
-; CHECK: vblendvpd
+; CHECK: vblendpd
 ; CHECK: ret
 define <4 x i64> @blend4(<4 x i64> %a, <4 x i64> %b) nounwind alwaysinline {
   %t = shufflevector <4 x i64> %a, <4 x i64> %b, <4 x i32> <i32 0, i32 1, i32 2, i32 7>
diff --git a/test/CodeGen/X86/vec_shuffle-20.ll b/test/CodeGen/X86/vec_shuffle-20.ll
index fc06b95..107411e 100644
--- a/test/CodeGen/X86/vec_shuffle-20.ll
+++ b/test/CodeGen/X86/vec_shuffle-20.ll
@@ -1,4 +1,4 @@
-; RUN: llc < %s -o /dev/null -march=x86 -mattr=+sse2 -mtriple=i686-apple-darwin9 -stats -info-output-file - | grep asm-printer | grep 3
+; RUN: llc < %s -o /dev/null -march=x86 -mattr=+sse2 -mtriple=i686-apple-darwin9 -stats -info-output-file - | grep asm-printer | grep 2
 
 define <4 x float> @func(<4 x float> %fp0, <4 x float> %fp1) nounwind  {
 entry:
author	Nadav Rotem <nadav.rotem@intel.com>	2012-04-10 14:33:13 +0000
committer	Nadav Rotem <nadav.rotem@intel.com>	2012-04-10 14:33:13 +0000
commit	50e64cfe6e250dbe2528fc5bda75c68b04a8bc49 (patch)
tree	11f8711c3c0c8a1418507063bde7ac8b81a7826f /test
parent	45fb79bc54159330979bf24e4bfbdbb64bee1e2c (diff)
download	external_llvm-50e64cfe6e250dbe2528fc5bda75c68b04a8bc49.zip external_llvm-50e64cfe6e250dbe2528fc5bda75c68b04a8bc49.tar.gz external_llvm-50e64cfe6e250dbe2528fc5bda75c68b04a8bc49.tar.bz2