From: Andrew Trick Date: Thu, 11 Jul 2013 17:08:59 +0000 (+0000) Subject: indvars: Improve LFTR by eliminating truncation when comparing against a constant. X-Git-Url: http://demsky.eecs.uci.edu/git/?a=commitdiff_plain;h=53b28f86236fc548143656929f39f38d9dc83e06;p=oota-llvm.git indvars: Improve LFTR by eliminating truncation when comparing against a constant. Patch by Michele Scandale! Adds special handling for the case where, during the loop exit condition rewriting, the exit value is a constant of bitwidth lower than the type of the induction variable: instead of introducing a trunc operation in order to correctly match the operand types, it converts the constant value to an equivalent constant, depending on the initial value of the induction variable and the trip count, in order to have an equivalent comparison between the induction variable and the new constant. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@186107 91177308-0d34-0410-b5e6-96231b3b80d8 --- diff --git a/lib/Transforms/Scalar/IndVarSimplify.cpp b/lib/Transforms/Scalar/IndVarSimplify.cpp index df11e92c9ed..ddb5b270d0c 100644 --- a/lib/Transforms/Scalar/IndVarSimplify.cpp +++ b/lib/Transforms/Scalar/IndVarSimplify.cpp @@ -1612,10 +1612,29 @@ LinearFunctionTestReplace(Loop *L, << " IVCount:\t" << *IVCount << "\n"); IRBuilder<> Builder(BI); - if (SE->getTypeSizeInBits(CmpIndVar->getType()) - > SE->getTypeSizeInBits(ExitCnt->getType())) { - CmpIndVar = Builder.CreateTrunc(CmpIndVar, ExitCnt->getType(), - "lftr.wideiv"); + + unsigned CmpIndVarSize = SE->getTypeSizeInBits(CmpIndVar->getType()); + unsigned ExitCntSize = SE->getTypeSizeInBits(ExitCnt->getType()); + if (CmpIndVarSize > ExitCntSize) { + const SCEVAddRecExpr *AR = cast(SE->getSCEV(IndVar)); + const SCEV *ARStart = AR->getStart(); + const SCEV *ARStep = AR->getStepRecurrence(*SE); + if (isa(ARStart) && isa(IVCount)) { + const APInt &Start = cast(ARStart)->getValue()->getValue(); + const APInt &Count = 
cast(IVCount)->getValue()->getValue(); + + APInt NewLimit; + if (cast(ARStep)->getValue()->isNegative()) + NewLimit = Start - Count.zext(CmpIndVarSize); + else + NewLimit = Start + Count.zext(CmpIndVarSize); + ExitCnt = ConstantInt::get(CmpIndVar->getType(), NewLimit); + + DEBUG(dbgs() << " Widen RHS:\t" << *ExitCnt << "\n"); + } else { + CmpIndVar = Builder.CreateTrunc(CmpIndVar, ExitCnt->getType(), + "lftr.wideiv"); + } } Value *Cond = Builder.CreateICmp(P, CmpIndVar, ExitCnt, "exitcond"); diff --git a/test/Transforms/IndVarSimplify/exitcnt-const-arstart-const-opt.ll b/test/Transforms/IndVarSimplify/exitcnt-const-arstart-const-opt.ll new file mode 100644 index 00000000000..185a67f2822 --- /dev/null +++ b/test/Transforms/IndVarSimplify/exitcnt-const-arstart-const-opt.ll @@ -0,0 +1,25 @@ +;RUN: opt -S %s -indvars | FileCheck %s + +; Function Attrs: nounwind uwtable +define void @foo() #0 { +entry: + br label %for.body + +for.body: ; preds = %entry, %for.body + %i.01 = phi i16 [ 0, %entry ], [ %inc, %for.body ] + %conv2 = sext i16 %i.01 to i32 + call void @bar(i32 %conv2) #1 + %inc = add i16 %i.01, 1 +;CHECK-NOT: %lftr.wideiv = trunc i32 %indvars.iv.next to i16 +;CHECK: %exitcond = icmp ne i32 %indvars.iv.next, 512 + %cmp = icmp slt i16 %inc, 512 + br i1 %cmp, label %for.body, label %for.end + +for.end: ; preds = %for.body + ret void +} + +declare void @bar(i32) + +attributes #0 = { nounwind uwtable } +attributes #1 = { nounwind }