diff options
Diffstat (limited to 'test/CodeGen/X86/x86-upgrade-avx-vbroadcast.ll')
-rw-r--r-- | test/CodeGen/X86/x86-upgrade-avx-vbroadcast.ll | 41 |
1 files changed, 41 insertions, 0 deletions
diff --git a/test/CodeGen/X86/x86-upgrade-avx-vbroadcast.ll b/test/CodeGen/X86/x86-upgrade-avx-vbroadcast.ll new file mode 100644 index 0000000..d885f1c --- /dev/null +++ b/test/CodeGen/X86/x86-upgrade-avx-vbroadcast.ll @@ -0,0 +1,41 @@ +; RUN: llc -mattr=+avx < %s | FileCheck %s + +; Check that we properly upgrade the AVX vbroadcast intrinsics to IR. The +; expectation is that we should still get the original instruction back that +; maps to the intrinsic. + +target datalayout = "e-m:o-i64:64-f80:128-n8:16:32:64-S128" +target triple = "x86_64-apple-macosx10.9.0" + +; CHECK-LABEL: test_mm_broadcast_ss: +define <4 x float> @test_mm_broadcast_ss(float* readonly %__a){ +entry: + %0 = bitcast float* %__a to i8* +; CHECK: vbroadcastss (%{{.*}}), %xmm + %1 = tail call <4 x float> @llvm.x86.avx.vbroadcast.ss(i8* %0) + ret <4 x float> %1 +} + +; CHECK-LABEL: test_mm256_broadcast_sd: +define <4 x double> @test_mm256_broadcast_sd(double* readonly %__a) { +entry: + %0 = bitcast double* %__a to i8* +; CHECK: vbroadcastsd (%{{.*}}), %ymm + %1 = tail call <4 x double> @llvm.x86.avx.vbroadcast.sd.256(i8* %0) + ret <4 x double> %1 +} + +; CHECK-LABEL: test_mm256_broadcast_ss: +define <8 x float> @test_mm256_broadcast_ss(float* readonly %__a) { +entry: + %0 = bitcast float* %__a to i8* +; CHECK: vbroadcastss (%{{.*}}), %ymm + %1 = tail call <8 x float> @llvm.x86.avx.vbroadcast.ss.256(i8* %0) + ret <8 x float> %1 +} + +declare <8 x float> @llvm.x86.avx.vbroadcast.ss.256(i8*) + +declare <4 x double> @llvm.x86.avx.vbroadcast.sd.256(i8*) + +declare <4 x float> @llvm.x86.avx.vbroadcast.ss(i8*) |