//
// This pass is a simple loop invariant code motion pass.
//
-// Note that this pass does NOT require pre-headers to exist on loops in the
-// CFG, but if there is not distinct preheader for a loop, the hoisted code will
-// be *DUPLICATED* in every basic block, outside of the loop, that preceeds the
-// loop header. Additionally, any use of one of these hoisted expressions
-// cannot be loop invariant itself, because the expression hoisted gets a PHI
-// node that is loop variant.
-//
-// For these reasons, and many more, it makes sense to run a pass before this
-// that ensures that there are preheaders on all loops. That said, we don't
-// REQUIRE it. :)
-//
//===----------------------------------------------------------------------===//
#include "llvm/Transforms/Scalar.h"
#include "llvm/Transforms/Utils/Local.h"
#include "llvm/Analysis/LoopInfo.h"
#include "llvm/Analysis/AliasAnalysis.h"
+#include "llvm/Analysis/Dominators.h"
#include "llvm/iOperators.h"
-#include "llvm/iPHINode.h"
#include "llvm/iMemory.h"
#include "llvm/Support/InstVisitor.h"
-#include "llvm/Support/CFG.h"
#include "Support/STLExtras.h"
#include "Support/StatisticReporter.h"
#include <algorithm>
using std::string;
-static Statistic<> NumHoistedNPH("licm\t\t- Number of insts hoisted to multiple"
- " loop preds (bad, no loop pre-header)");
-static Statistic<> NumHoistedPH("licm\t\t- Number of insts hoisted to a loop "
- "pre-header");
-static Statistic<> NumHoistedLoads("licm\t\t- Number of load insts hoisted");
-
namespace {
+ Statistic<>NumHoisted("licm\t\t- Number of instructions hoisted out of loop");
+ Statistic<> NumHoistedLoads("licm\t\t- Number of load insts hoisted");
+
struct LICM : public FunctionPass, public InstVisitor<LICM> {
virtual bool runOnFunction(Function &F);
- // This transformation requires natural loop information...
+ /// This transformation requires natural loop information & requires that
+ /// loop preheaders be inserted into the CFG...
+ ///
virtual void getAnalysisUsage(AnalysisUsage &AU) const {
AU.preservesCFG();
AU.addRequiredID(LoopPreheadersID);
AU.addRequired<LoopInfo>();
+ AU.addRequired<DominatorTree>();
AU.addRequired<AliasAnalysis>();
}
private:
- // List of predecessor blocks for the current loop - These blocks are where
- // we hoist loop invariants to for the current loop.
- //
- std::vector<BasicBlock*> LoopPreds, LoopBackEdges;
+ Loop *CurLoop; // The current loop we are working on...
+ BasicBlock *Preheader; // The preheader block of the current loop...
+ bool Changed; // Set to true when we change anything.
+ AliasAnalysis *AA; // Currently AliasAnalysis information
- Loop *CurLoop; // The current loop we are working on...
- bool Changed; // Set to true when we change anything.
- AliasAnalysis *AA; // Currently AliasAnalysis information
-
- // visitLoop - Hoist expressions out of the specified loop...
+ /// visitLoop - Hoist expressions out of the specified loop...
+ ///
void visitLoop(Loop *L);
- // notInCurrentLoop - Little predicate that returns true if the specified
- // basic block is in a subloop of the current one, not the current one
- // itself.
- //
- bool notInCurrentLoop(BasicBlock *BB) {
+ /// HoistRegion - Walk the specified region of the CFG (defined by all
+ /// blocks dominated by the specified block, and that are in the current
+ /// loop) in depth first order w.r.t the DominatorTree. This allows us to
+ /// visit defintions before uses, allowing us to hoist a loop body in one
+ /// pass without iteration.
+ ///
+ void HoistRegion(DominatorTree::Node *N);
+
+ /// inCurrentLoop - Little predicate that returns false if the specified
+ /// basic block is in a subloop of the current one, not the current one
+ /// itself.
+ ///
+ bool inCurrentLoop(BasicBlock *BB) {
for (unsigned i = 0, e = CurLoop->getSubLoops().size(); i != e; ++i)
if (CurLoop->getSubLoops()[i]->contains(BB))
- return true; // A subloop actually contains this block!
- return false;
+ return false; // A subloop actually contains this block!
+ return true;
}
- // hoist - When an instruction is found to only use loop invariant operands
- // that is safe to hoist, this instruction is called to do the dirty work.
- //
+ /// hoist - When an instruction is found to only use loop invariant operands
+ /// that is safe to hoist, this instruction is called to do the dirty work.
+ ///
void hoist(Instruction &I);
- // pointerInvalidatedByLoop - Return true if the body of this loop may store
- // into the memory location pointed to by V.
- //
+ /// pointerInvalidatedByLoop - Return true if the body of this loop may
+ /// store into the memory location pointed to by V.
+ ///
bool pointerInvalidatedByLoop(Value *V);
- // isLoopInvariant - Return true if the specified value is loop invariant
+ /// isLoopInvariant - Return true if the specified value is loop invariant
+ ///
inline bool isLoopInvariant(Value *V) {
if (Instruction *I = dyn_cast<Instruction>(V))
return !CurLoop->contains(I->getParent());
return true; // All non-instructions are loop invariant
}
- // visitBasicBlock - Run LICM on a particular block.
- void visitBasicBlock(BasicBlock *BB);
-
- // Instruction visitation handlers... these basically control whether or not
- // the specified instruction types are hoisted.
- //
+ /// Instruction visitation handlers... these basically control whether or
+ /// not the specified instruction types are hoisted.
+ ///
friend class InstVisitor<LICM>;
void visitBinaryOperator(Instruction &I) {
if (isLoopInvariant(I.getOperand(0)) && isLoopInvariant(I.getOperand(1)))
Pass *createLICMPass() { return new LICM(); }
+/// runOnFunction - For LICM, this simply traverses the loop structure of the
+/// function, hoisting expressions out of loops if possible.
+///
bool LICM::runOnFunction(Function &) {
- // get our loop information...
+ // Get information about the top level loops in the function...
const std::vector<Loop*> &TopLevelLoops =
getAnalysis<LoopInfo>().getTopLevelLoops();
return Changed;
}
+
+/// visitLoop - Hoist expressions out of the specified loop...
+///
void LICM::visitLoop(Loop *L) {
// Recurse through all subloops before we process this loop...
std::for_each(L->getSubLoops().begin(), L->getSubLoops().end(),
bind_obj(this, &LICM::visitLoop));
CurLoop = L;
- // Calculate the set of predecessors for this loop. The predecessors for this
- // loop are equal to the predecessors for the header node of the loop that are
- // not themselves in the loop.
- //
- BasicBlock *Header = L->getHeader();
-
- // Calculate the sets of predecessors and backedges of the loop...
- LoopBackEdges.insert(LoopBackEdges.end(),pred_begin(Header),pred_end(Header));
-
- std::vector<BasicBlock*>::iterator LPI =
- std::partition(LoopBackEdges.begin(), LoopBackEdges.end(),
- bind_obj(CurLoop, &Loop::contains));
-
- // Move all predecessors to the LoopPreds vector...
- LoopPreds.insert(LoopPreds.end(), LPI, LoopBackEdges.end());
+ // Get the preheader block to move instructions into...
+ Preheader = L->getLoopPreheader();
+ assert(Preheader&&"Preheader insertion pass guarantees we have a preheader!");
- // Remove predecessors from backedges list...
- LoopBackEdges.erase(LPI, LoopBackEdges.end());
-
-
- // The only way that there could be no predecessors to a loop is if the loop
- // is not reachable. Since we don't care about optimizing dead loops,
- // summarily ignore them.
- //
- if (LoopPreds.empty()) return;
-
// We want to visit all of the instructions in this loop... that are not parts
// of our subloops (they have already had their invariants hoisted out of
// their loop, into this loop, so there is no need to process the BODIES of
// the subloops).
//
- std::vector<BasicBlock*> BBs(L->getBlocks().begin(), L->getBlocks().end());
-
- // Remove blocks that are actually in subloops...
- BBs.erase(std::remove_if(BBs.begin(), BBs.end(),
- bind_obj(this, &LICM::notInCurrentLoop)), BBs.end());
-
- // Visit all of the basic blocks we have chosen, hoisting out the instructions
- // as neccesary. This leaves dead copies of the instruction in the loop
- // unfortunately...
+ // Traverse the body of the loop in depth first order on the dominator tree so
+ // that we are guaranteed to see definitions before we see uses. This allows
+ // us to perform the LICM transformation in one pass, without iteration.
//
- for_each(BBs.begin(), BBs.end(), bind_obj(this, &LICM::visitBasicBlock));
+ HoistRegion(getAnalysis<DominatorTree>()[L->getHeader()]);
// Clear out loops state information for the next iteration
CurLoop = 0;
- LoopPreds.clear();
- LoopBackEdges.clear();
+ Preheader = 0;
}
-void LICM::visitBasicBlock(BasicBlock *BB) {
- for (BasicBlock::iterator I = BB->begin(), E = BB->end(); I != E; ) {
- visit(*I);
-
- if (dceInstruction(I))
- Changed = true;
- else
- ++I;
- }
-}
+/// HoistRegion - Walk the specified region of the CFG (defined by all blocks
+/// dominated by the specified block, and that are in the current loop) in depth
+/// first order w.r.t the DominatorTree. This allows us to visit defintions
+/// before uses, allowing us to hoist a loop body in one pass without iteration.
+///
+void LICM::HoistRegion(DominatorTree::Node *N) {
+ assert(N != 0 && "Null dominator tree node?");
+ // This subregion is not in the loop, it has already been already been hoisted
+ if (!inCurrentLoop(N->getNode()))
+ return;
-void LICM::hoist(Instruction &Inst) {
- if (Inst.use_empty()) return; // Don't (re) hoist dead instructions!
- //cerr << "Hoisting " << Inst;
+ visit(*N->getNode());
- BasicBlock *Header = CurLoop->getHeader();
+ const std::vector<DominatorTree::Node*> &Children = N->getChildren();
+ for (unsigned i = 0, e = Children.size(); i != e; ++i)
+ HoistRegion(Children[i]);
+}
- // Old instruction will be removed, so take it's name...
- string InstName = Inst.getName();
- Inst.setName("");
- if (isa<LoadInst>(Inst))
- ++NumHoistedLoads;
+/// hoist - When an instruction is found to only use loop invariant operands
+/// that is safe to hoist, this instruction is called to do the dirty work.
+///
+void LICM::hoist(Instruction &Inst) {
+ DEBUG(std::cerr << "LICM hoisting: " << Inst);
- // The common case is that we have a pre-header. Generate special case code
- // that is faster if that is the case.
- //
- if (LoopPreds.size() == 1) {
- BasicBlock *Pred = LoopPreds[0];
-
- // Create a new copy of the instruction, for insertion into Pred.
- Instruction *New = Inst.clone();
- New->setName(InstName);
-
- // Insert the new node in Pred, before the terminator.
- Pred->getInstList().insert(--Pred->end(), New);
-
- // Kill the old instruction...
- Inst.replaceAllUsesWith(New);
- ++NumHoistedPH;
-
- } else {
- // No loop pre-header, insert a PHI node into header to capture all of the
- // incoming versions of the value.
- //
- PHINode *LoopVal = new PHINode(Inst.getType(), InstName+".phi",
- Header->begin());
-
- // Insert cloned versions of the instruction into all of the loop preds.
- for (unsigned i = 0, e = LoopPreds.size(); i != e; ++i) {
- BasicBlock *Pred = LoopPreds[i];
-
- // Create a new copy of the instruction, for insertion into Pred.
- Instruction *New = Inst.clone();
- New->setName(InstName);
-
- // Insert the new node in Pred, before the terminator.
- Pred->getInstList().insert(--Pred->end(), New);
-
- // Add the incoming value to the PHI node.
- LoopVal->addIncoming(New, Pred);
- }
+ BasicBlock *Header = CurLoop->getHeader();
- // Add incoming values to the PHI node for all backedges in the loop...
- for (unsigned i = 0, e = LoopBackEdges.size(); i != e; ++i)
- LoopVal->addIncoming(LoopVal, LoopBackEdges[i]);
-
- // Replace all uses of the old version of the instruction in the loop with
- // the new version that is out of the loop. We know that this is ok,
- // because the new definition is in the loop header, which dominates the
- // entire loop body. The old definition was defined _inside_ of the loop,
- // so the scope cannot extend outside of the loop, so we're ok.
- //
- Inst.replaceAllUsesWith(LoopVal);
- ++NumHoistedNPH;
- }
+ // Remove the instruction from its current basic block... but don't delete the
+ // instruction.
+ Inst.getParent()->getInstList().remove(&Inst);
+ // Insert the new node in Preheader, before the terminator.
+ Preheader->getInstList().insert(Preheader->getTerminator(), &Inst);
+
+ ++NumHoisted;
Changed = true;
}
void LICM::visitLoadInst(LoadInst &LI) {
if (isLoopInvariant(LI.getOperand(0)) &&
- !pointerInvalidatedByLoop(LI.getOperand(0)))
+ !pointerInvalidatedByLoop(LI.getOperand(0))) {
hoist(LI);
-
+ ++NumHoistedLoads;
+ }
}
-// pointerInvalidatedByLoop - Return true if the body of this loop may store
-// into the memory location pointed to by V.
-//
+/// pointerInvalidatedByLoop - Return true if the body of this loop may store
+/// into the memory location pointed to by V.
+///
bool LICM::pointerInvalidatedByLoop(Value *V) {
// Check to see if any of the basic blocks in CurLoop invalidate V.
for (unsigned i = 0, e = CurLoop->getBlocks().size(); i != e; ++i)