diff options
author | Vincent Lejeune <vljn@ovi.com> | 2013-06-04 23:17:15 +0000 |
---|---|---|
committer | Vincent Lejeune <vljn@ovi.com> | 2013-06-04 23:17:15 +0000 |
commit | e67a4afb5da59c02338622eea68e096ba143113f (patch) | |
tree | 73c85516285abe45df6f12fa2a7a2971eb555c31 /test/CodeGen/R600/dot4-folding.ll | |
parent | 00ed010d9ef388d718ac358132848661b286f7b0 (diff) | |
download | external_llvm-e67a4afb5da59c02338622eea68e096ba143113f.zip external_llvm-e67a4afb5da59c02338622eea68e096ba143113f.tar.gz external_llvm-e67a4afb5da59c02338622eea68e096ba143113f.tar.bz2 |
R600: Const/Neg/Abs can be folded to dot4
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@183278 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'test/CodeGen/R600/dot4-folding.ll')
-rw-r--r-- | test/CodeGen/R600/dot4-folding.ll | 27 |
1 file changed, 27 insertions, 0 deletions
```diff
diff --git a/test/CodeGen/R600/dot4-folding.ll b/test/CodeGen/R600/dot4-folding.ll
new file mode 100644
index 0000000..3e8330f
--- /dev/null
+++ b/test/CodeGen/R600/dot4-folding.ll
@@ -0,0 +1,27 @@
+;RUN: llc < %s -march=r600 -mcpu=redwood | FileCheck %s
+
+; Exactly one constant vector can be folded into dot4, which means exactly
+; 4 MOV instructions
+; CHECK: @main
+; CHECK: MOV
+; CHECK: MOV
+; CHECK: MOV
+; CHECK: MOV
+; CHECK-NOT: MOV
+; CHECK-NOT: MOV
+; CHECK-NOT: MOV
+; CHECK-NOT: MOV
+
+define void @main(float addrspace(1)* %out) {
+main_body:
+  %0 = load <4 x float> addrspace(8)* null
+  %1 = load <4 x float> addrspace(8)* getelementptr ([1024 x <4 x float>] addrspace(8)* null, i64 0, i32 1)
+  %2 = call float @llvm.AMDGPU.dp4(<4 x float> %0,<4 x float> %1)
+  %3 = insertelement <4 x float> undef, float %2, i32 0
+  call void @llvm.R600.store.swizzle(<4 x float> %3, i32 0, i32 0)
+  ret void
+}
+
+declare float @llvm.AMDGPU.dp4(<4 x float>, <4 x float>) #1
+declare void @llvm.R600.store.swizzle(<4 x float>, i32, i32)
+attributes #1 = { readnone }
```