aboutsummaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
author Hal Finkel <hfinkel@anl.gov> 2012-10-30 19:47:37 +0000
committer Hal Finkel <hfinkel@anl.gov> 2012-10-30 19:47:37 +0000
commit 8a69a95f913dadae92d2ce0b3ac551610bf868e0 (patch)
tree 09ab18d5479231040fea2ddea06263ce8ce7db71
parent b33b34a7dc447cf52702b8892c9829344e81f73a (diff)
download external_llvm-8a69a95f913dadae92d2ce0b3ac551610bf868e0.zip
external_llvm-8a69a95f913dadae92d2ce0b3ac551610bf868e0.tar.gz
external_llvm-8a69a95f913dadae92d2ce0b3ac551610bf868e0.tar.bz2
BBVectorize: Fix a small bug introduced in r167042.
We need to make sure that we take the correct load/store alignment when the inputs are flipped.

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@167044 91177308-0d34-0410-b5e6-96231b3b80d8
-rw-r--r-- lib/Transforms/Vectorize/BBVectorize.cpp 1
-rw-r--r-- test/Transforms/BBVectorize/simple-ldstr.ll 28
2 files changed, 28 insertions, 1 deletion
diff --git a/lib/Transforms/Vectorize/BBVectorize.cpp b/lib/Transforms/Vectorize/BBVectorize.cpp
index b29a45e..32a18f2 100644
--- a/lib/Transforms/Vectorize/BBVectorize.cpp
+++ b/lib/Transforms/Vectorize/BBVectorize.cpp
@@ -2472,7 +2472,6 @@ namespace {
Instruction *L = I, *H = J;
if (FlipMemInputs)
std::swap(H, L);
- FlipMemInputs = false;
unsigned NumOperands = I->getNumOperands();
SmallVector<Value *, 3> ReplacedOperands(NumOperands);
diff --git a/test/Transforms/BBVectorize/simple-ldstr.ll b/test/Transforms/BBVectorize/simple-ldstr.ll
index c1e6a09..6883e84 100644
--- a/test/Transforms/BBVectorize/simple-ldstr.ll
+++ b/test/Transforms/BBVectorize/simple-ldstr.ll
@@ -140,3 +140,31 @@ if.end:
; CHECK-AO-NOT: <2 x double>
}
+; Simple 3-pair chain with loads and stores
+define void @test5(double* %a, double* %b, double* %c) nounwind uwtable readonly {
+entry:
+ %i0 = load double* %a, align 8
+ %i1 = load double* %b, align 8
+ %mul = fmul double %i0, %i1
+ %arrayidx3 = getelementptr inbounds double* %a, i64 1
+ %i3 = load double* %arrayidx3, align 8
+ %arrayidx4 = getelementptr inbounds double* %b, i64 1
+ %i4 = load double* %arrayidx4, align 8
+ %mul5 = fmul double %i3, %i4
+ %arrayidx5 = getelementptr inbounds double* %c, i64 1
+ store double %mul5, double* %arrayidx5, align 8
+ store double %mul, double* %c, align 4
+ ret void
+; CHECK: @test5
+; CHECK: %i0.v.i0 = bitcast double* %a to <2 x double>*
+; CHECK: %i1.v.i0 = bitcast double* %b to <2 x double>*
+; CHECK: %i0 = load <2 x double>* %i0.v.i0, align 8
+; CHECK: %i1 = load <2 x double>* %i1.v.i0, align 8
+; CHECK: %mul = fmul <2 x double> %i0, %i1
+; CHECK: %0 = bitcast double* %c to <2 x double>*
+; CHECK: store <2 x double> %mul, <2 x double>* %0, align 4
+; CHECK: ret void
+; CHECK-AO: @test5
+; CHECK-AO-NOT: <2 x double>
+}
+