aboutsummaryrefslogtreecommitdiffstats
path: root/test/CodeGen/R600/dot4-folding.ll
diff options
context:
space:
mode:
author: Vincent Lejeune <vljn@ovi.com> 2013-06-04 23:17:15 +0000
committer: Vincent Lejeune <vljn@ovi.com> 2013-06-04 23:17:15 +0000
commit: e67a4afb5da59c02338622eea68e096ba143113f (patch)
tree: 73c85516285abe45df6f12fa2a7a2971eb555c31 /test/CodeGen/R600/dot4-folding.ll
parent: 00ed010d9ef388d718ac358132848661b286f7b0 (diff)
download: external_llvm-e67a4afb5da59c02338622eea68e096ba143113f.zip
external_llvm-e67a4afb5da59c02338622eea68e096ba143113f.tar.gz
external_llvm-e67a4afb5da59c02338622eea68e096ba143113f.tar.bz2
R600: Const/Neg/Abs can be folded to dot4
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@183278 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'test/CodeGen/R600/dot4-folding.ll')
-rw-r--r-- test/CodeGen/R600/dot4-folding.ll 27
1 files changed, 27 insertions, 0 deletions
diff --git a/test/CodeGen/R600/dot4-folding.ll b/test/CodeGen/R600/dot4-folding.ll
new file mode 100644
index 0000000..3e8330f
--- /dev/null
+++ b/test/CodeGen/R600/dot4-folding.ll
@@ -0,0 +1,27 @@
+;RUN: llc < %s -march=r600 -mcpu=redwood | FileCheck %s
+
+; Only one of the two constant vectors can be folded into dot4, so the other
+; one still has to be moved lane by lane: expect exactly 4 MOV instructions.
+; CHECK: @main
+; CHECK: MOV
+; CHECK: MOV
+; CHECK: MOV
+; CHECK: MOV
+; CHECK-NOT: MOV
+; CHECK-NOT: MOV
+; CHECK-NOT: MOV
+; CHECK-NOT: MOV
+
+define void @main(float addrspace(1)* %out) { ; test kernel; %out is never referenced in the body
+main_body:
+ %0 = load <4 x float> addrspace(8)* null ; first operand: vector at address null in addrspace(8) (presumably constant memory on R600 - TODO confirm)
+ %1 = load <4 x float> addrspace(8)* getelementptr ([1024 x <4 x float>] addrspace(8)* null, i64 0, i32 1) ; second operand: element 1 of a [1024 x <4 x float>] array based at null, same address space
+ %2 = call float @llvm.AMDGPU.dp4(<4 x float> %0,<4 x float> %1) ; dp4 intrinsic on the two loaded vectors; presumably the dot4 the header comment refers to
+ %3 = insertelement <4 x float> undef, float %2, i32 0 ; put the scalar result in lane 0; the other lanes stay undef
+ call void @llvm.R600.store.swizzle(<4 x float> %3, i32 0, i32 0) ; hand the result vector to the store intrinsic, both i32 arguments zero
+ ret void
+}
+
+declare float @llvm.AMDGPU.dp4(<4 x float>, <4 x float>) #1 ; two <4 x float> in, one float out; carries attribute group #1
+declare void @llvm.R600.store.swizzle(<4 x float>, i32, i32) ; returns nothing and has no attribute group attached
+attributes #1 = { readnone } ; group #1, referenced only by the dp4 declaration in this file