[LV] Switch to using canonical induction variables.

author James Molloy <james.molloy@arm.com>

Wed, 2 Sep 2015 10:14:54 +0000 (10:14 +0000)

committer James Molloy <james.molloy@arm.com>

Wed, 2 Sep 2015 10:14:54 +0000 (10:14 +0000)
author James Molloy <james.molloy@arm.com>
Wed, 2 Sep 2015 10:14:54 +0000 (10:14 +0000)
committer James Molloy <james.molloy@arm.com>
Wed, 2 Sep 2015 10:14:54 +0000 (10:14 +0000)
diff --git a/lib/Transforms/Vectorize/LoopVectorize.cpp b/lib/Transforms/Vectorize/LoopVectorize.cpp

index eaa3ecd48e47a2060c13af8ad50b86b4d871c602..70199ace35cd3551e6aee6ac49e48533df81b84f 100644 (file)
--- a/lib/Transforms/Vectorize/LoopVectorize.cpp
+++ b/lib/Transforms/Vectorize/LoopVectorize.cpp
@@ -2652,15 +2652,8 @@ void InnerLoopVectorizer::createEmptyLoop() {
                        ConstantInt::get(ExitCountValue->getType(), VF * UF),
                        "min.iters.check", VectorPH->getTerminator());
  
-  // The loop index does not have to start at Zero. Find the original start
-  // value from the induction PHI node. If we don't have an induction variable
-  // then we know that it starts at zero.
    Builder.SetInsertPoint(VectorPH->getTerminator());
-  Value *StartIdx = ExtendedIdx =
-      OldInduction
-          ? Builder.CreateZExt(OldInduction->getIncomingValueForBlock(VectorPH),
-                               IdxTy)
-          : ConstantInt::get(IdxTy, 0);
+  Value *StartIdx = ExtendedIdx = ConstantInt::get(IdxTy, 0);
  
    // Count holds the overall loop count (N).
    Value *Count = Exp.expandCodeFor(ExitCount, ExitCount->getType(),
@@ -3542,10 +3535,8 @@ void InnerLoopVectorizer::widenPHIInstruction(Instruction *PN,
        } else {
          // Handle other induction variables that are now based on the
          // canonical one.
-        Value *NormalizedIdx = Builder.CreateSub(Induction, ExtendedIdx,
-                                                 "normalized.idx");
-        NormalizedIdx = Builder.CreateSExtOrTrunc(NormalizedIdx, PhiTy);
-        Broadcasted = II.transform(Builder, NormalizedIdx);
+        auto *V = Builder.CreateSExtOrTrunc(Induction, PhiTy);
+        Broadcasted = II.transform(Builder, V);
          Broadcasted->setName("offset.idx");
        }
        Broadcasted = getBroadcastInstrs(Broadcasted);
@@ -4134,10 +4125,13 @@ bool LoopVectorizationLegality::canVectorizeInstrs() {
  
            // Int inductions are special because we only allow one IV.
            if (ID.getKind() == InductionDescriptor::IK_IntInduction &&
-              ID.getStepValue()->isOne()) {
+              ID.getStepValue()->isOne() &&
+              isa<Constant>(ID.getStartValue()) &&
+                cast<Constant>(ID.getStartValue())->isNullValue()) {
              // Use the phi node with the widest type as induction. Use the last
              // one if there are multiple (no good reason for doing this other
-            // than it is expedient).
+            // than it is expedient). We've checked that it begins at zero and
+            // steps by one, so this is a canonical induction variable.
              if (!Induction || PhiTy == WidestIndTy)
                Induction = Phi;
            }
diff --git a/test/Transforms/LoopVectorize/induction.ll b/test/Transforms/LoopVectorize/induction.ll

index 48566ef92f7fdf5794083ae2647609673fc2a5ec..f8017dd110672705494134308968f8c18d6c3804 100644 (file)
--- a/test/Transforms/LoopVectorize/induction.ll
+++ b/test/Transforms/LoopVectorize/induction.ll
@@ -6,8 +6,7 @@ target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f3
  ; CHECK-LABEL: @multi_int_induction(
  ; CHECK: vector.body:
  ; CHECK:  %index = phi i64 [ 0, %vector.ph ], [ %index.next, %vector.body ]
-; CHECK:  %normalized.idx = sub i64 %index, 0
-; CHECK:  %[[VAR:.*]] = trunc i64 %normalized.idx to i32
+; CHECK:  %[[VAR:.*]] = trunc i64 %index to i32
  ; CHECK:  %offset.idx = add i32 190, %[[VAR]]
  define void @multi_int_induction(i32* %A, i32 %N) {
  for.body.lr.ph:
@@ -142,11 +141,10 @@ define i32 @max_i32_backedgetaken() nounwind readnone ssp uwtable {
  ; CHECK-LABEL: testoverflowcheck
  ; CHECK: entry
  ; CHECK: %[[LOAD:.*]] = load i8
-; CHECK: %[[VAL:.*]] =  zext i8 %[[LOAD]] to i32
  ; CHECK: br
  
  ; CHECK: scalar.ph
-; CHECK: phi i32 [ %{{.*}}, %middle.block ], [ %[[VAL]], %entry ]
+; CHECK: phi i8 [ %{{.*}}, %middle.block ], [ %[[LOAD]], %entry ]
  
  @e = global i8 1, align 1
  @d = common global i32 0, align 4
diff --git a/test/Transforms/LoopVectorize/reverse_induction.ll b/test/Transforms/LoopVectorize/reverse_induction.ll

index 6b63a0d8db6c42b7fddd13b920a5d22b7eca101d..88dd2e4d66ca5872936d0ff8c63dfd33b56d6127 100644 (file)
--- a/test/Transforms/LoopVectorize/reverse_induction.ll
+++ b/test/Transforms/LoopVectorize/reverse_induction.ll
@@ -96,8 +96,7 @@ loopend:
  ; CHECK-LABEL: @reverse_forward_induction_i64_i8(
  ; CHECK: vector.body
  ; CHECK: %index = phi i64 [ 0, %vector.ph ], [ %index.next, %vector.body ]
-; CHECK: %normalized.idx = sub i64 %index, 0
-; CHECK: %offset.idx = sub i64 1023, %normalized.idx
+; CHECK: %offset.idx = sub i64 1023, %index
  ; CHECK: trunc i64 %index to i8
  
  define void @reverse_forward_induction_i64_i8() {
@@ -122,10 +121,8 @@ while.end:
  
  ; CHECK-LABEL: @reverse_forward_induction_i64_i8_signed(
  ; CHECK: vector.body:
-; CHECK:  %index = phi i64 [ 129, %vector.ph ], [ %index.next, %vector.body ]
-; CHECK:  %normalized.idx = sub i64 %index, 129
-; CHECK:  %offset.idx = sub i64 1023, %normalized.idx
-; CHECK:  trunc i64 %index to i8
+; CHECK:  %index = phi i64 [ 0, %vector.ph ], [ %index.next, %vector.body ]
+; CHECK:  %offset.idx = sub i64 1023, %index
  
  define void @reverse_forward_induction_i64_i8_signed() {
  entry:
author	James Molloy <james.molloy@arm.com>
	Wed, 2 Sep 2015 10:14:54 +0000 (10:14 +0000)
committer	James Molloy <james.molloy@arm.com>
	Wed, 2 Sep 2015 10:14:54 +0000 (10:14 +0000)
lib/Transforms/Vectorize/LoopVectorize.cpp		patch | blob | history
test/Transforms/LoopVectorize/induction.ll		patch | blob | history
test/Transforms/LoopVectorize/reverse_induction.ll		patch | blob | history