#include "Support/DepthFirstIterator.h"
#include "Support/Statistic.h"
#include "Support/STLExtras.h"
+#include <algorithm>
using namespace llvm;
namespace {
- Statistic<> numSpilled ("ra-linearscan", "Number of registers spilled");
- Statistic<> numReloaded("ra-linearscan", "Number of registers reloaded");
+ Statistic<> numStores("ra-linearscan", "Number of stores added");
+ Statistic<> numLoads ("ra-linearscan", "Number of loads added");
+
+ class PhysRegTracker {
+ private:
+ const MRegisterInfo* mri_;
+ std::vector<unsigned> regUse_;
- class RA : public MachineFunctionPass {
public:
- typedef std::vector<const LiveIntervals::Interval*> IntervalPtrs;
+ PhysRegTracker(MachineFunction* mf)
+ : mri_(mf ? mf->getTarget().getRegisterInfo() : NULL) {
+ if (mri_) {
+ regUse_.assign(mri_->getNumRegs(), 0);
+ }
+ }
+
+ PhysRegTracker(const PhysRegTracker& rhs)
+ : mri_(rhs.mri_),
+ regUse_(rhs.regUse_) {
+ }
+
+ const PhysRegTracker& operator=(const PhysRegTracker& rhs) {
+ mri_ = rhs.mri_;
+ regUse_ = rhs.regUse_;
+ return *this;
+ }
+
+ void addPhysRegUse(unsigned physReg) {
+ ++regUse_[physReg];
+ for (const unsigned* as = mri_->getAliasSet(physReg); *as; ++as) {
+ physReg = *as;
+ ++regUse_[physReg];
+ }
+ }
+ void delPhysRegUse(unsigned physReg) {
+ assert(regUse_[physReg] != 0);
+ --regUse_[physReg];
+ for (const unsigned* as = mri_->getAliasSet(physReg); *as; ++as) {
+ physReg = *as;
+ assert(regUse_[physReg] != 0);
+ --regUse_[physReg];
+ }
+ }
+
+ bool isPhysRegAvail(unsigned physReg) const {
+ return regUse_[physReg] == 0;
+ }
+ };
+
+ class RA : public MachineFunctionPass {
private:
MachineFunction* mf_;
const TargetMachine* tm_;
+ const TargetInstrInfo* tii_;
const MRegisterInfo* mri_;
- MachineBasicBlock* currentMbb_;
- MachineBasicBlock::iterator currentInstr_;
- typedef LiveIntervals::Intervals Intervals;
- const Intervals* li_;
- IntervalPtrs active_, inactive_;
-
- typedef std::vector<unsigned> Regs;
- Regs tempUseOperands_;
- Regs tempDefOperands_;
-
- typedef std::vector<bool> RegMask;
- RegMask reserved_;
+ LiveIntervals* li_;
+ typedef std::list<LiveIntervals::Interval*> IntervalPtrs;
+ IntervalPtrs unhandled_, fixed_, active_, inactive_, handled_;
- unsigned regUse_[MRegisterInfo::FirstVirtualRegister];
- unsigned regUseBackup_[MRegisterInfo::FirstVirtualRegister];
-
- typedef LiveIntervals::MachineBasicBlockPtrs MachineBasicBlockPtrs;
- MachineBasicBlockPtrs mbbs_;
+ PhysRegTracker prt_;
typedef std::map<unsigned, unsigned> Virt2PhysMap;
Virt2PhysMap v2pMap_;
int instrAdded_;
+ typedef std::vector<float> SpillWeights;
+ SpillWeights spillWeights_;
+
public:
+ RA()
+ : prt_(NULL) {
+
+ }
+
virtual const char* getPassName() const {
return "Linear Scan Register Allocator";
}
MachineFunctionPass::getAnalysisUsage(AU);
}
- private:
/// runOnMachineFunction - register allocate the whole function
bool runOnMachineFunction(MachineFunction&);
- /// verifyIntervals - verify that we have no inconsistencies
- /// in the register assignments we have in active and inactive
- /// lists
- bool verifyIntervals();
+ void releaseMemory();
+
+ private:
+ /// initIntervalSets - initializa the four interval sets:
+ /// unhandled, fixed, active and inactive
+ void initIntervalSets(LiveIntervals::Intervals& li);
/// processActiveIntervals - expire old intervals and move
/// non-overlapping ones to the incative list
- void processActiveIntervals(Intervals::const_iterator cur);
+ void processActiveIntervals(IntervalPtrs::value_type cur);
/// processInactiveIntervals - expire old intervals and move
/// overlapping ones to the active list
- void processInactiveIntervals(Intervals::const_iterator cur);
+ void processInactiveIntervals(IntervalPtrs::value_type cur);
+
+ /// updateSpillWeights - updates the spill weights of the
+ /// specifed physical register and its weight
+ void updateSpillWeights(unsigned reg, SpillWeights::value_type weight);
+
+ /// assignRegOrStackSlotAtInterval - assign a register if one
+ /// is available, or spill.
+ void assignRegOrStackSlotAtInterval(IntervalPtrs::value_type cur);
- /// assignStackSlotAtInterval - choose and spill
- /// interval. Currently we spill the interval with the last
- /// end point in the active and inactive lists and the current
- /// interval
- void assignStackSlotAtInterval(Intervals::const_iterator cur);
+ /// addSpillCode - adds spill code for interval. The interval
+ /// must be modified by LiveIntervals::updateIntervalForSpill.
+ void addSpillCode(IntervalPtrs::value_type li, int slot);
///
/// register handling helpers
/// getFreePhysReg - return a free physical register for this
/// virtual register interval if we have one, otherwise return
/// 0
- unsigned getFreePhysReg(Intervals::const_iterator cur);
-
- /// physRegAvailable - returns true if the specifed physical
- /// register is available
- bool physRegAvailable(unsigned physReg);
-
- /// tempPhysRegAvailable - returns true if the specifed
- /// temporary physical register is available
- bool tempPhysRegAvailable(unsigned physReg);
-
- /// getFreeTempPhysReg - return a free temprorary physical
- /// register for this virtual register if we have one (should
- /// never return 0)
- unsigned getFreeTempPhysReg(unsigned virtReg);
+ unsigned getFreePhysReg(IntervalPtrs::value_type cur);
/// assignVirt2PhysReg - assigns the free physical register to
/// the virtual register passed as arguments
- void assignVirt2PhysReg(unsigned virtReg, unsigned physReg);
+ Virt2PhysMap::iterator
+ assignVirt2PhysReg(unsigned virtReg, unsigned physReg);
/// clearVirtReg - free the physical register associated with this
/// virtual register and disassociate virtual->physical and
/// physical->virtual mappings
- void clearVirtReg(unsigned virtReg);
+ void clearVirtReg(Virt2PhysMap::iterator it);
/// assignVirt2StackSlot - assigns this virtual register to a
- /// stack slot
- void assignVirt2StackSlot(unsigned virtReg);
+ /// stack slot. returns the stack slot
+ int assignVirt2StackSlot(unsigned virtReg);
/// getStackSlot - returns the offset of the specified
/// register on the stack
int getStackSlot(unsigned virtReg);
- /// spillVirtReg - spills the virtual register
- void spillVirtReg(unsigned virtReg);
+ void printVirtRegAssignment() const {
+ std::cerr << "register assignment:\n";
- /// loadPhysReg - loads to the physical register the value of
- /// the virtual register specifed. Virtual register must have
- /// an assigned stack slot
- void loadVirt2PhysReg(unsigned virtReg, unsigned physReg);
-
- void markPhysRegFree(unsigned physReg);
- void markPhysRegNotFree(unsigned physReg);
-
- void backupRegUse() {
- memcpy(regUseBackup_, regUse_, sizeof(regUseBackup_));
- }
-
- void restoreRegUse() {
- memcpy(regUse_, regUseBackup_, sizeof(regUseBackup_));
- }
-
- void printVirt2PhysMap() const {
- std::cerr << "allocated registers:\n";
for (Virt2PhysMap::const_iterator
i = v2pMap_.begin(), e = v2pMap_.end(); i != e; ++i) {
- std::cerr << '[' << i->first << ','
+ assert(i->second != 0);
+ std::cerr << "[reg" << i->first << " -> "
<< mri_->getName(i->second) << "]\n";
}
+ for (Virt2StackSlotMap::const_iterator
+ i = v2ssMap_.begin(), e = v2ssMap_.end(); i != e; ++i) {
+ std::cerr << '[' << i->first << " -> ss#" << i->second << "]\n";
+ }
std::cerr << '\n';
}
+
void printIntervals(const char* const str,
RA::IntervalPtrs::const_iterator i,
RA::IntervalPtrs::const_iterator e) const {
if (str) std::cerr << str << " intervals:\n";
for (; i != e; ++i) {
- std::cerr << "\t\t" << **i << " -> ";
- if ((*i)->reg < MRegisterInfo::FirstVirtualRegister) {
- std::cerr << mri_->getName((*i)->reg);
- }
- else {
- std::cerr << mri_->getName(v2pMap_.find((*i)->reg)->second);
+ std::cerr << "\t" << **i << " -> ";
+ unsigned reg = (*i)->reg;
+ if (MRegisterInfo::isVirtualRegister(reg)) {
+ Virt2PhysMap::const_iterator it = v2pMap_.find(reg);
+ reg = (it == v2pMap_.end() ? 0 : it->second);
}
- std::cerr << '\n';
+ std::cerr << mri_->getName(reg) << '\n';
}
}
- void printFreeRegs(const char* const str,
- const TargetRegisterClass* rc) const {
- if (str) std::cerr << str << ':';
- for (TargetRegisterClass::iterator i =
- rc->allocation_order_begin(*mf_);
- i != rc->allocation_order_end(*mf_); ++i) {
- unsigned reg = *i;
- if (!regUse_[reg]) {
- std::cerr << ' ' << mri_->getName(reg);
- if (reserved_[reg]) std::cerr << "*";
- }
- }
- std::cerr << '\n';
+
+ void verifyAssignment() const {
+ for (Virt2PhysMap::const_iterator i = v2pMap_.begin(),
+ e = v2pMap_.end(); i != e; ++i)
+ for (Virt2PhysMap::const_iterator i2 = next(i); i2 != e; ++i2)
+ if (MRegisterInfo::isVirtualRegister(i->second) &&
+ (i->second == i2->second ||
+ mri_->areAliases(i->second, i2->second))) {
+ const LiveIntervals::Interval
+ &in = li_->getInterval(i->second),
+ &in2 = li_->getInterval(i2->second);
+ if (in.overlaps(in2)) {
+ std::cerr << in << " overlaps " << in2 << '\n';
+ assert(0);
+ }
+ }
}
};
}
+void RA::releaseMemory()
+{
+ v2pMap_.clear();
+ v2ssMap_.clear();
+ unhandled_.clear();
+ active_.clear();
+ inactive_.clear();
+ fixed_.clear();
+ handled_.clear();
+}
+
bool RA::runOnMachineFunction(MachineFunction &fn) {
mf_ = &fn;
tm_ = &fn.getTarget();
+ tii_ = &tm_->getInstrInfo();
mri_ = tm_->getRegisterInfo();
- li_ = &getAnalysis<LiveIntervals>().getIntervals();
- active_.clear();
- inactive_.clear();
-
- mbbs_ = getAnalysis<LiveIntervals>().getOrderedMachineBasicBlockPtrs();
- v2pMap_.clear();
- v2ssMap_.clear();
- memset(regUse_, 0, sizeof(regUse_));
- memset(regUseBackup_, 0, sizeof(regUseBackup_));
-
- DEBUG(
- unsigned i = 0;
- for (MachineBasicBlockPtrs::iterator
- mbbi = mbbs_.begin(), mbbe = mbbs_.end();
- mbbi != mbbe; ++mbbi) {
- MachineBasicBlock* mbb = *mbbi;
- std::cerr << mbb->getBasicBlock()->getName() << '\n';
- for (MachineBasicBlock::iterator
- ii = mbb->begin(), ie = mbb->end();
- ii != ie; ++ii) {
- MachineInstr* instr = *ii;
-
- std::cerr << i++ << "\t";
- instr->print(std::cerr, *tm_);
- }
+ li_ = &getAnalysis<LiveIntervals>();
+ prt_ = PhysRegTracker(mf_);
+
+ initIntervalSets(li_->getIntervals());
+
+ // linear scan algorithm
+ DEBUG(std::cerr << "********** LINEAR SCAN **********\n");
+ DEBUG(std::cerr << "********** Function: "
+ << mf_->getFunction()->getName() << '\n');
+
+ DEBUG(printIntervals("unhandled", unhandled_.begin(), unhandled_.end()));
+ DEBUG(printIntervals("fixed", fixed_.begin(), fixed_.end()));
+ DEBUG(printIntervals("active", active_.begin(), active_.end()));
+ DEBUG(printIntervals("inactive", inactive_.begin(), inactive_.end()));
+
+ while (!unhandled_.empty() || !fixed_.empty()) {
+ // pick the interval with the earliest start point
+ IntervalPtrs::value_type cur;
+ if (fixed_.empty()) {
+ cur = unhandled_.front();
+ unhandled_.pop_front();
}
- );
-
- // FIXME: this will work only for the X86 backend. I need to
- // device an algorthm to select the minimal (considering register
- // aliasing) number of temp registers to reserve so that we have 2
- // registers for each register class available.
-
- // reserve R32: EDI, EBX,
- // R16: DI, BX,
- // R8: BH, BL
- // RFP: FP5, FP6
- reserved_.assign(MRegisterInfo::FirstVirtualRegister, false);
- reserved_[19] = true; /* EDI */
- reserved_[17] = true; /* EBX */
- reserved_[12] = true; /* DI */
- reserved_[ 7] = true; /* BX */
- reserved_[ 4] = true; /* BH */
- reserved_[ 5] = true; /* BL */
- reserved_[28] = true; /* FP5 */
- reserved_[29] = true; /* FP6 */
-
- // liner scan algorithm
- for (Intervals::const_iterator
- i = li_->begin(), e = li_->end(); i != e; ++i) {
- DEBUG(std::cerr << "processing current interval: " << *i << '\n');
-
- DEBUG(printIntervals("\tactive", active_.begin(), active_.end()));
- DEBUG(printIntervals("\tinactive", inactive_.begin(), inactive_.end()));
- processActiveIntervals(i);
- processInactiveIntervals(i);
-
- backupRegUse();
-
- // for every interval in inactive we overlap mark the register
- // as not free
- for (IntervalPtrs::iterator j = inactive_.begin();
- j != inactive_.end(); ++j) {
- unsigned reg = (*j)->reg;
- if (reg >= MRegisterInfo::FirstVirtualRegister)
- reg = v2pMap_[reg];
-
- if (i->overlaps(**j)) {
- markPhysRegNotFree(reg);
- }
+ else if (unhandled_.empty()) {
+ cur = fixed_.front();
+ fixed_.pop_front();
}
-
- // for every pre-allocated interval in unhandled we overlap
- // mark the register as not free
- for (Intervals::const_iterator j = i + 1; j != e; ++j) {
- if (j->reg < MRegisterInfo::FirstVirtualRegister &&
- i->overlaps(*j))
- markPhysRegNotFree(j->reg);
+ else if (unhandled_.front()->start() < fixed_.front()->start()) {
+ cur = unhandled_.front();
+ unhandled_.pop_front();
}
+ else {
+ cur = fixed_.front();
+ fixed_.pop_front();
+ }
+
+ DEBUG(std::cerr << "\n*** CURRENT ***: " << *cur << '\n');
- DEBUG(std::cerr << "\tallocating current interval:\n");
- // if this register is preallocated reserve it
- if (i->reg < MRegisterInfo::FirstVirtualRegister) {
- restoreRegUse();
- markPhysRegNotFree(i->reg);
- active_.push_back(&*i);
+ processActiveIntervals(cur);
+ processInactiveIntervals(cur);
+
+ // if this register is fixed we are done
+ if (MRegisterInfo::isPhysicalRegister(cur->reg)) {
+ prt_.addPhysRegUse(cur->reg);
+ active_.push_back(cur);
+ handled_.push_back(cur);
}
// otherwise we are allocating a virtual register. try to find
// a free physical register or spill an interval in order to
// assign it one (we could spill the current though).
else {
- unsigned physReg = getFreePhysReg(i);
- if (!physReg) {
- assignStackSlotAtInterval(i);
- }
- else {
- restoreRegUse();
- assignVirt2PhysReg(i->reg, physReg);
- active_.push_back(&*i);
- }
+ assignRegOrStackSlotAtInterval(cur);
}
+
+ DEBUG(printIntervals("active", active_.begin(), active_.end()));
+ DEBUG(printIntervals("inactive", inactive_.begin(), inactive_.end()));
+ // DEBUG(verifyAssignment());
}
+
// expire any remaining active intervals
for (IntervalPtrs::iterator i = active_.begin(); i != active_.end(); ++i) {
unsigned reg = (*i)->reg;
- DEBUG(std::cerr << "\t\tinterval " << **i << " expired\n");
- if (reg >= MRegisterInfo::FirstVirtualRegister) {
+ DEBUG(std::cerr << "\tinterval " << **i << " expired\n");
+ if (MRegisterInfo::isVirtualRegister(reg)) {
reg = v2pMap_[reg];
}
- markPhysRegFree(reg);
+ prt_.delPhysRegUse(reg);
}
- DEBUG(std::cerr << "finished register allocation\n");
- DEBUG(printVirt2PhysMap());
+ DEBUG(printVirtRegAssignment());
- DEBUG(std::cerr << "Rewrite machine code:\n");
- for (MachineBasicBlockPtrs::iterator
- mbbi = mbbs_.begin(), mbbe = mbbs_.end(); mbbi != mbbe; ++mbbi) {
- instrAdded_ = 0;
- currentMbb_ = *mbbi;
-
- for (currentInstr_ = currentMbb_->begin();
- currentInstr_ != currentMbb_->end(); ++currentInstr_) {
+ DEBUG(std::cerr << "********** REWRITE MACHINE CODE **********\n");
+ DEBUG(std::cerr << "********** Function: "
+ << mf_->getFunction()->getName() << '\n');
- DEBUG(std::cerr << "\tinstruction: ";
- (*currentInstr_)->print(std::cerr, *tm_););
+ for (MachineFunction::iterator mbbi = mf_->begin(), mbbe = mf_->end();
+ mbbi != mbbe; ++mbbi) {
+ instrAdded_ = 0;
- // use our current mapping and actually replace and
+ for (MachineBasicBlock::iterator mii = mbbi->begin(), mie = mbbi->end();
+ mii != mie; ++mii) {
+ DEBUG(
+ std::cerr << '[';
+ unsigned index = li_->getInstructionIndex(mii);
+ if (index == std::numeric_limits<unsigned>::max())
+ std::cerr << '*';
+ else
+ std::cerr << index;
+ std::cerr << "]\t";
+ mii->print(std::cerr, *tm_));
+
+ // use our current mapping and actually replace every
// virtual register with its allocated physical registers
- DEBUG(std::cerr << "\t\treplacing virtual registers with mapped "
- "physical registers:\n");
- for (unsigned i = 0, e = (*currentInstr_)->getNumOperands();
+ DEBUG(std::cerr << "\t");
+ for (unsigned i = 0, e = mii->getNumOperands();
i != e; ++i) {
- MachineOperand& op = (*currentInstr_)->getOperand(i);
- if (op.isVirtualRegister()) {
- unsigned virtReg = op.getAllocatedRegNum();
- unsigned physReg = v2pMap_[virtReg];
- if (physReg) {
- DEBUG(std::cerr << "\t\t\t%reg" << virtReg
- << " -> " << mri_->getName(physReg) << '\n');
- (*currentInstr_)->SetMachineOperandReg(i, physReg);
- }
- }
- }
-
- DEBUG(std::cerr << "\t\tloading temporarily used operands to "
- "registers:\n");
- for (unsigned i = 0, e = (*currentInstr_)->getNumOperands();
- i != e; ++i) {
- MachineOperand& op = (*currentInstr_)->getOperand(i);
- if (op.isVirtualRegister() && op.isUse() && !op.isDef()) {
- unsigned virtReg = op.getAllocatedRegNum();
- unsigned physReg = v2pMap_[virtReg];
- if (!physReg) {
- physReg = getFreeTempPhysReg(virtReg);
- loadVirt2PhysReg(virtReg, physReg);
- tempUseOperands_.push_back(virtReg);
- }
- (*currentInstr_)->SetMachineOperandReg(i, physReg);
+ MachineOperand& op = mii->getOperand(i);
+ if (op.isRegister() &&
+ MRegisterInfo::isVirtualRegister(op.getReg())) {
+ unsigned virtReg = op.getReg();
+ Virt2PhysMap::iterator it = v2pMap_.find(virtReg);
+ assert(it != v2pMap_.end() &&
+ "all virtual registers must be allocated");
+ unsigned physReg = it->second;
+ assert(MRegisterInfo::isPhysicalRegister(physReg));
+ DEBUG(std::cerr << "\t[reg" << virtReg
+ << " -> " << mri_->getName(physReg) << ']');
+ mii->SetMachineOperandReg(i, physReg);
}
}
+ DEBUG(std::cerr << '\n');
+ }
+ }
- DEBUG(std::cerr << "\t\tclearing temporarily used operands:\n");
- for (unsigned i = 0, e = tempUseOperands_.size(); i != e; ++i) {
- clearVirtReg(tempUseOperands_[i]);
+ DEBUG(std::cerr << "********** MACHINEINSTRS **********\n");
+ DEBUG(
+ for (MachineFunction::iterator mbbi = mf_->begin(), mbbe = mf_->end();
+ mbbi != mbbe; ++mbbi) {
+ for (MachineBasicBlock::iterator mii = mbbi->begin(),
+ mie = mbbi->end(); mii != mie; ++mii) {
+ unsigned index = li_->getInstructionIndex(mii);
+ if (index == std::numeric_limits<unsigned>::max())
+ std::cerr << "*\t";
+ else
+ std::cerr << index << '\t';
+ mii->print(std::cerr, *tm_);
}
- tempUseOperands_.clear();
+ });
- DEBUG(std::cerr << "\t\tassigning temporarily defined operands to "
- "registers:\n");
- for (unsigned i = 0, e = (*currentInstr_)->getNumOperands();
- i != e; ++i) {
- MachineOperand& op = (*currentInstr_)->getOperand(i);
- if (op.isVirtualRegister() && op.isDef()) {
- unsigned virtReg = op.getAllocatedRegNum();
- unsigned physReg = v2pMap_[virtReg];
- if (!physReg) {
- physReg = getFreeTempPhysReg(virtReg);
- }
- if (op.isUse()) { // def and use
- loadVirt2PhysReg(virtReg, physReg);
- }
- else {
- assignVirt2PhysReg(virtReg, physReg);
- }
- tempDefOperands_.push_back(virtReg);
- (*currentInstr_)->SetMachineOperandReg(i, physReg);
- }
- }
+ return true;
+}
- DEBUG(std::cerr << "\t\tspilling temporarily defined operands "
- "of this instruction:\n");
- ++currentInstr_; // we want to insert after this instruction
- for (unsigned i = 0, e = tempDefOperands_.size(); i != e; ++i) {
- spillVirtReg(tempDefOperands_[i]);
- }
- --currentInstr_; // restore currentInstr_ iterator
- tempDefOperands_.clear();
- }
+void RA::initIntervalSets(LiveIntervals::Intervals& li)
+{
+ assert(unhandled_.empty() && fixed_.empty() &&
+ active_.empty() && inactive_.empty() &&
+ "interval sets should be empty on initialization");
+
+ for (LiveIntervals::Intervals::iterator i = li.begin(), e = li.end();
+ i != e; ++i) {
+ if (MRegisterInfo::isPhysicalRegister(i->reg))
+ fixed_.push_back(&*i);
+ else
+ unhandled_.push_back(&*i);
}
-
- return true;
}
-void RA::processActiveIntervals(Intervals::const_iterator cur)
+void RA::processActiveIntervals(IntervalPtrs::value_type cur)
{
DEBUG(std::cerr << "\tprocessing active intervals:\n");
for (IntervalPtrs::iterator i = active_.begin(); i != active_.end();) {
unsigned reg = (*i)->reg;
- // remove expired intervals. we expire earlier because this if
- // an interval expires this is going to be the last use. in
- // this case we can reuse the register for a def in the same
- // instruction
- if ((*i)->expiredAt(cur->start() + 1)) {
+ // remove expired intervals
+ if ((*i)->expiredAt(cur->start())) {
DEBUG(std::cerr << "\t\tinterval " << **i << " expired\n");
- if (reg >= MRegisterInfo::FirstVirtualRegister) {
+ if (MRegisterInfo::isVirtualRegister(reg)) {
reg = v2pMap_[reg];
}
- markPhysRegFree(reg);
+ prt_.delPhysRegUse(reg);
// remove from active
i = active_.erase(i);
}
// move inactive intervals to inactive list
else if (!(*i)->liveAt(cur->start())) {
- DEBUG(std::cerr << "\t\t\tinterval " << **i << " inactive\n");
- if (reg >= MRegisterInfo::FirstVirtualRegister) {
+ DEBUG(std::cerr << "\t\tinterval " << **i << " inactive\n");
+ if (MRegisterInfo::isVirtualRegister(reg)) {
reg = v2pMap_[reg];
}
- markPhysRegFree(reg);
+ prt_.delPhysRegUse(reg);
// add to inactive
inactive_.push_back(*i);
// remove from active
}
}
-void RA::processInactiveIntervals(Intervals::const_iterator cur)
+void RA::processInactiveIntervals(IntervalPtrs::value_type cur)
{
DEBUG(std::cerr << "\tprocessing inactive intervals:\n");
for (IntervalPtrs::iterator i = inactive_.begin(); i != inactive_.end();) {
unsigned reg = (*i)->reg;
- // remove expired intervals. we expire earlier because this if
- // an interval expires this is going to be the last use. in
- // this case we can reuse the register for a def in the same
- // instruction
- if ((*i)->expiredAt(cur->start() + 1)) {
- DEBUG(std::cerr << "\t\t\tinterval " << **i << " expired\n");
+ // remove expired intervals
+ if ((*i)->expiredAt(cur->start())) {
+ DEBUG(std::cerr << "\t\tinterval " << **i << " expired\n");
// remove from inactive
i = inactive_.erase(i);
}
// move re-activated intervals in active list
else if ((*i)->liveAt(cur->start())) {
- DEBUG(std::cerr << "\t\t\tinterval " << **i << " active\n");
- if (reg >= MRegisterInfo::FirstVirtualRegister) {
+ DEBUG(std::cerr << "\t\tinterval " << **i << " active\n");
+ if (MRegisterInfo::isVirtualRegister(reg)) {
reg = v2pMap_[reg];
}
- markPhysRegNotFree(reg);
+ prt_.addPhysRegUse(reg);
// add to active
active_.push_back(*i);
// remove from inactive
}
}
-namespace {
- template <typename T>
- void updateWeight(T rw[], int reg, T w)
- {
- if (rw[reg] == std::numeric_limits<T>::max() ||
- w == std::numeric_limits<T>::max())
- rw[reg] = std::numeric_limits<T>::max();
- else
- rw[reg] += w;
- }
+void RA::updateSpillWeights(unsigned reg, SpillWeights::value_type weight)
+{
+ spillWeights_[reg] += weight;
+ for (const unsigned* as = mri_->getAliasSet(reg); *as; ++as)
+ spillWeights_[*as] += weight;
}
-void RA::assignStackSlotAtInterval(Intervals::const_iterator cur)
+void RA::assignRegOrStackSlotAtInterval(IntervalPtrs::value_type cur)
{
- DEBUG(std::cerr << "\t\tassigning stack slot at interval "
- << *cur << ":\n");
+ DEBUG(std::cerr << "\tallocating current interval: ");
- // set all weights to zero
- float regWeight[MRegisterInfo::FirstVirtualRegister];
- for (unsigned i = 0; i < MRegisterInfo::FirstVirtualRegister; ++i)
- regWeight[i] = 0.0F;
+ PhysRegTracker backupPrt = prt_;
- // for each interval in active that overlaps
- for (IntervalPtrs::iterator i = active_.begin(); i != active_.end(); ++i) {
- if (!cur->overlaps(**i))
- continue;
+ spillWeights_.assign(mri_->getNumRegs(), 0.0);
+ // for each interval in active update spill weights
+ for (IntervalPtrs::const_iterator i = active_.begin(), e = active_.end();
+ i != e; ++i) {
unsigned reg = (*i)->reg;
- if (reg >= MRegisterInfo::FirstVirtualRegister) {
+ if (MRegisterInfo::isVirtualRegister(reg))
reg = v2pMap_[reg];
- }
- updateWeight(regWeight, reg, (*i)->weight);
- for (const unsigned* as = mri_->getAliasSet(reg); *as; ++as)
- updateWeight(regWeight, *as, (*i)->weight);
+ updateSpillWeights(reg, (*i)->weight);
}
- // for each interval in inactive that overlaps
- for (IntervalPtrs::iterator i = inactive_.begin();
- i != inactive_.end(); ++i) {
- if (!cur->overlaps(**i))
- continue;
+ // for every interval in inactive we overlap with, mark the
+ // register as not free and update spill weights
+ for (IntervalPtrs::const_iterator i = inactive_.begin(),
+ e = inactive_.end(); i != e; ++i) {
+ if (cur->overlaps(**i)) {
+ unsigned reg = (*i)->reg;
+ if (MRegisterInfo::isVirtualRegister(reg))
+ reg = v2pMap_[reg];
+ prt_.addPhysRegUse(reg);
+ updateSpillWeights(reg, (*i)->weight);
+ }
+ }
- unsigned reg = (*i)->reg;
- if (reg >= MRegisterInfo::FirstVirtualRegister) {
- reg = v2pMap_[reg];
+ // for every interval in fixed we overlap with,
+ // mark the register as not free and update spill weights
+ for (IntervalPtrs::const_iterator i = fixed_.begin(),
+ e = fixed_.end(); i != e; ++i) {
+ if (cur->overlaps(**i)) {
+ unsigned reg = (*i)->reg;
+ prt_.addPhysRegUse(reg);
+ updateSpillWeights(reg, (*i)->weight);
}
- updateWeight(regWeight, reg, (*i)->weight);
- for (const unsigned* as = mri_->getAliasSet(reg); *as; ++as)
- updateWeight(regWeight, *as, (*i)->weight);
}
- // for each fixed interval in unhandled that overlaps
- for (Intervals::const_iterator j = cur + 1; j != li_->end(); ++j) {
- if (j->reg >= MRegisterInfo::FirstVirtualRegister)
- continue;
- updateWeight(regWeight, j->reg, j->weight);
- for (const unsigned* as = mri_->getAliasSet(j->reg); *as; ++as)
- updateWeight(regWeight, *as, j->weight);
+ unsigned physReg = getFreePhysReg(cur);
+ // restore the physical register tracker
+ prt_ = backupPrt;
+ // if we find a free register, we are done: assign this virtual to
+ // the free physical register and add this interval to the active
+ // list.
+ if (physReg) {
+ DEBUG(std::cerr << mri_->getName(physReg) << '\n');
+ assignVirt2PhysReg(cur->reg, physReg);
+ active_.push_back(cur);
+ handled_.push_back(cur);
+ return;
}
+ DEBUG(std::cerr << "no free registers\n");
+
+ DEBUG(std::cerr << "\tassigning stack slot at interval "<< *cur << ":\n");
- float minWeight = std::numeric_limits<float>::max();
+ float minWeight = std::numeric_limits<float>::infinity();
unsigned minReg = 0;
const TargetRegisterClass* rc = mf_->getSSARegMap()->getRegClass(cur->reg);
for (TargetRegisterClass::iterator i = rc->allocation_order_begin(*mf_);
i != rc->allocation_order_end(*mf_); ++i) {
unsigned reg = *i;
- if (!reserved_[reg] && minWeight > regWeight[reg]) {
- minWeight = regWeight[reg];
+ if (minWeight > spillWeights_[reg]) {
+ minWeight = spillWeights_[reg];
minReg = reg;
}
}
+ DEBUG(std::cerr << "\t\tregister with min weight: "
+ << mri_->getName(minReg) << " (" << minWeight << ")\n");
+
+ // if the current has the minimum weight, we need to modify it,
+ // push it back in unhandled and let the linear scan algorithm run
+ // again
+ if (cur->weight <= minWeight) {
+ DEBUG(std::cerr << "\t\t\tspilling(c): " << *cur << '\n';);
+ int slot = assignVirt2StackSlot(cur->reg);
+ li_->updateSpilledInterval(*cur, slot);
+
+ // if we didn't eliminate the interval find where to add it
+ // back to unhandled. We need to scan since unhandled are
+ // sorted on earliest start point and we may have changed our
+ // start point.
+ if (!cur->empty()) {
+ addSpillCode(cur, slot);
+ IntervalPtrs::iterator it = unhandled_.begin();
+ while (it != unhandled_.end() && (*it)->start() < cur->start())
+ ++it;
+ unhandled_.insert(it, cur);
+ }
+ return;
+ }
+
+ // push the current interval back to unhandled since we are going
+ // to re-run at least this iteration. Since we didn't modify it it
+ // should go back right in the front of the list
+ unhandled_.push_front(cur);
- if (cur->weight < minWeight) {
- restoreRegUse();
- DEBUG(std::cerr << "\t\t\t\tspilling : " << mri_->getName(minReg)
- << ", weight: " << cur->weight << '\n');
- assignVirt2StackSlot(cur->reg);
+ // otherwise we spill all intervals aliasing the register with
+ // minimum weight, rollback to the interval with the earliest
+ // start point and let the linear scan algorithm run again
+ std::vector<bool> toSpill(mri_->getNumRegs(), false);
+ toSpill[minReg] = true;
+ for (const unsigned* as = mri_->getAliasSet(minReg); *as; ++as)
+ toSpill[*as] = true;
+ unsigned earliestStart = cur->start();
+
+ for (IntervalPtrs::iterator i = active_.begin(); i != active_.end(); ++i) {
+ unsigned reg = (*i)->reg;
+ if (MRegisterInfo::isVirtualRegister(reg) &&
+ toSpill[v2pMap_[reg]] &&
+ cur->overlaps(**i)) {
+ DEBUG(std::cerr << "\t\t\tspilling(a): " << **i << '\n');
+ earliestStart = std::min(earliestStart, (*i)->start());
+ int slot = assignVirt2StackSlot((*i)->reg);
+ li_->updateSpilledInterval(**i, slot);
+ addSpillCode(*i, slot);
+ }
}
- else {
- std::set<unsigned> toSpill;
- toSpill.insert(minReg);
- for (const unsigned* as = mri_->getAliasSet(minReg); *as; ++as)
- toSpill.insert(*as);
-
- std::vector<unsigned> spilled;
- for (IntervalPtrs::iterator i = active_.begin();
- i != active_.end(); ) {
- unsigned reg = (*i)->reg;
- if (reg >= MRegisterInfo::FirstVirtualRegister &&
- toSpill.find(v2pMap_[reg]) != toSpill.end() &&
- cur->overlaps(**i)) {
- spilled.push_back(v2pMap_[reg]);
- DEBUG(std::cerr << "\t\t\t\tspilling : "
- << mri_->getName(minReg) << ", weight: "
- << (*i)->weight << '\n');
- assignVirt2StackSlot(reg);
- i = active_.erase(i);
+ for (IntervalPtrs::iterator i = inactive_.begin();
+ i != inactive_.end(); ++i) {
+ unsigned reg = (*i)->reg;
+ if (MRegisterInfo::isVirtualRegister(reg) &&
+ toSpill[v2pMap_[reg]] &&
+ cur->overlaps(**i)) {
+ DEBUG(std::cerr << "\t\t\tspilling(i): " << **i << '\n');
+ earliestStart = std::min(earliestStart, (*i)->start());
+ int slot = assignVirt2StackSlot((*i)->reg);
+ li_->updateSpilledInterval(**i, slot);
+ addSpillCode(*i, slot);
+ }
+ }
+
+ DEBUG(std::cerr << "\t\trolling back to: " << earliestStart << '\n');
+ // scan handled in reverse order and undo each one, restoring the
+ // state of unhandled and fixed
+ while (!handled_.empty()) {
+ IntervalPtrs::value_type i = handled_.back();
+ // if this interval starts before t we are done
+ if (!i->empty() && i->start() < earliestStart)
+ break;
+ DEBUG(std::cerr << "\t\t\tundo changes for: " << *i << '\n');
+ handled_.pop_back();
+ IntervalPtrs::iterator it;
+ if ((it = find(active_.begin(), active_.end(), i)) != active_.end()) {
+ active_.erase(it);
+ if (MRegisterInfo::isPhysicalRegister(i->reg)) {
+ fixed_.push_front(i);
+ prt_.delPhysRegUse(i->reg);
}
else {
- ++i;
+ Virt2PhysMap::iterator v2pIt = v2pMap_.find(i->reg);
+ clearVirtReg(v2pIt);
+ prt_.delPhysRegUse(v2pIt->second);
+ if (i->spilled()) {
+ if (!i->empty()) {
+ IntervalPtrs::iterator it = unhandled_.begin();
+ while (it != unhandled_.end() &&
+ (*it)->start() < i->start())
+ ++it;
+ unhandled_.insert(it, i);
+ }
+ }
+ else
+ unhandled_.push_front(i);
+
}
}
- for (IntervalPtrs::iterator i = inactive_.begin();
- i != inactive_.end(); ) {
- unsigned reg = (*i)->reg;
- if (reg >= MRegisterInfo::FirstVirtualRegister &&
- toSpill.find(v2pMap_[reg]) != toSpill.end() &&
- cur->overlaps(**i)) {
- DEBUG(std::cerr << "\t\t\t\tspilling : "
- << mri_->getName(minReg) << ", weight: "
- << (*i)->weight << '\n');
- assignVirt2StackSlot(reg);
- i = inactive_.erase(i);
+ else if ((it = find(inactive_.begin(), inactive_.end(), i)) != inactive_.end()) {
+ inactive_.erase(it);
+ if (MRegisterInfo::isPhysicalRegister(i->reg))
+ fixed_.push_front(i);
+ else {
+ Virt2PhysMap::iterator v2pIt = v2pMap_.find(i->reg);
+ clearVirtReg(v2pIt);
+ if (i->spilled()) {
+ if (!i->empty()) {
+ IntervalPtrs::iterator it = unhandled_.begin();
+ while (it != unhandled_.end() &&
+ (*it)->start() < i->start())
+ ++it;
+ unhandled_.insert(it, i);
+ }
+ }
+ else
+ unhandled_.push_front(i);
}
+ }
+ else {
+ if (MRegisterInfo::isPhysicalRegister(i->reg))
+ fixed_.push_front(i);
else {
- ++i;
+ Virt2PhysMap::iterator v2pIt = v2pMap_.find(i->reg);
+ clearVirtReg(v2pIt);
+ unhandled_.push_front(i);
}
}
-
- unsigned physReg = getFreePhysReg(cur);
- assert(physReg && "no free physical register after spill?");
-
- restoreRegUse();
- for (unsigned i = 0; i < spilled.size(); ++i)
- markPhysRegFree(spilled[i]);
-
- assignVirt2PhysReg(cur->reg, physReg);
- active_.push_back(&*cur);
}
-}
-
-bool RA::physRegAvailable(unsigned physReg)
-{
- assert(!reserved_[physReg] &&
- "cannot call this method with a reserved register");
- return !regUse_[physReg];
-}
-
-unsigned RA::getFreePhysReg(Intervals::const_iterator cur)
-{
- DEBUG(std::cerr << "\t\tgetting free physical register: ");
-
- const TargetRegisterClass* rc = mf_->getSSARegMap()->getRegClass(cur->reg);
- for (TargetRegisterClass::iterator i = rc->allocation_order_begin(*mf_);
- i != rc->allocation_order_end(*mf_); ++i) {
- unsigned reg = *i;
- if (!reserved_[reg] && !regUse_[reg]) {
- DEBUG(std::cerr << mri_->getName(reg) << '\n');
- return reg;
+ // scan the rest and undo each interval that expired after t and
+ // insert it in active (the next iteration of the algorithm will
+ // put it in inactive if required)
+ IntervalPtrs::iterator i = handled_.begin(), e = handled_.end();
+ for (; i != e; ++i) {
+ if (!(*i)->expiredAt(earliestStart) && (*i)->expiredAt(cur->start())) {
+ DEBUG(std::cerr << "\t\t\tundo changes for: " << **i << '\n');
+ active_.push_back(*i);
+ if (MRegisterInfo::isPhysicalRegister((*i)->reg))
+ prt_.addPhysRegUse((*i)->reg);
+ else {
+ assert(v2pMap_.count((*i)->reg));
+ prt_.addPhysRegUse(v2pMap_.find((*i)->reg)->second);
+ }
}
}
-
- DEBUG(std::cerr << "no free register\n");
- return 0;
}
-bool RA::tempPhysRegAvailable(unsigned physReg)
+void RA::addSpillCode(IntervalPtrs::value_type li, int slot)
{
- assert(reserved_[physReg] &&
- "cannot call this method with a not reserved temp register");
+ // We scan the instructions corresponding to each range. We load
+ // when we have a use and spill at end of basic blocks or end of
+ // ranges only if the register was modified.
+ const TargetRegisterClass* rc = mf_->getSSARegMap()->getRegClass(li->reg);
+
+ for (LiveIntervals::Interval::Ranges::iterator i = li->ranges.begin(),
+ e = li->ranges.end(); i != e; ++i) {
+ unsigned index = i->first;
+ unsigned end = i->second;
+
+ bool loaded = false;
+
+ // skip deleted instructions. getInstructionFromIndex returns
+ // null if the instruction was deleted (because of coalescing
+ // for example)
+ while (!li_->getInstructionFromIndex(index))
+ index += LiveIntervals::InstrSlots::NUM;
+ MachineBasicBlock::iterator mi = li_->getInstructionFromIndex(index);
+ MachineBasicBlock* mbb = mi->getParent();
+ assert(mbb && "machine instruction not bound to basic block");
+
+ for (; index < end; index += LiveIntervals::InstrSlots::NUM) {
+ // ignore deleted instructions
+ while (!li_->getInstructionFromIndex(index)) index += 2;
+ mi = li_->getInstructionFromIndex(index);
+ DEBUG(std::cerr << "\t\t\t\texamining: \t\t\t\t\t"
+ << LiveIntervals::getBaseIndex(index) << '\t';
+ mi->print(std::cerr, *tm_));
+
+ // if it is used in this instruction load it
+ for (unsigned i = 0; i < mi->getNumOperands(); ++i) {
+ MachineOperand& mop = mi->getOperand(i);
+ if (mop.isRegister() && mop.getReg() == li->reg &&
+ mop.isUse() && !loaded) {
+ loaded = true;
+ mri_->loadRegFromStackSlot(*mbb, mi, li->reg, slot, rc);
+ ++numLoads;
+ DEBUG(std::cerr << "\t\t\t\tadded load for reg" << li->reg
+ << " from ss#" << slot << " before: \t"
+ << LiveIntervals::getBaseIndex(index) << '\t';
+ mi->print(std::cerr, *tm_));
+ }
+ }
- return !regUse_[physReg];
+ // if it is defined in this instruction mark as dirty
+ for (unsigned i = 0; i < mi->getNumOperands(); ++i) {
+ MachineOperand& mop = mi->getOperand(i);
+ if (mop.isRegister() && mop.getReg() == li->reg &&
+ mop.isDef()) {
+ loaded = true;
+
+ mri_->storeRegToStackSlot(*mbb, next(mi), li->reg, slot,rc);
+ ++numStores;
+ DEBUG(std::cerr << "\t\t\t\tadded store for reg" << li->reg
+ << " to ss#" << slot << " after: \t\t"
+ << LiveIntervals::getBaseIndex(index) << " \t";
+ prior(mi,2)->print(std::cerr, *tm_));
+ }
+ }
+ }
+ }
}
-unsigned RA::getFreeTempPhysReg(unsigned virtReg)
+unsigned RA::getFreePhysReg(IntervalPtrs::value_type cur)
{
- DEBUG(std::cerr << "\t\tgetting free temporary physical register: ");
+ const TargetRegisterClass* rc = mf_->getSSARegMap()->getRegClass(cur->reg);
- const TargetRegisterClass* rc = mf_->getSSARegMap()->getRegClass(virtReg);
- // go in reverse allocation order for the temp registers
- for (TargetRegisterClass::iterator i = rc->allocation_order_end(*mf_) - 1;
- i != rc->allocation_order_begin(*mf_) - 1; --i) {
+ for (TargetRegisterClass::iterator i = rc->allocation_order_begin(*mf_);
+ i != rc->allocation_order_end(*mf_); ++i) {
unsigned reg = *i;
- if (reserved_[reg] && !regUse_[reg]) {
- DEBUG(std::cerr << mri_->getName(reg) << '\n');
+ if (prt_.isPhysRegAvail(reg))
return reg;
- }
}
-
- assert(0 && "no free temporary physical register?");
return 0;
}
-void RA::assignVirt2PhysReg(unsigned virtReg, unsigned physReg)
+RA::Virt2PhysMap::iterator
+RA::assignVirt2PhysReg(unsigned virtReg, unsigned physReg)
{
- v2pMap_[virtReg] = physReg;
- markPhysRegNotFree(physReg);
+ bool inserted;
+ Virt2PhysMap::iterator it;
+ tie(it, inserted) = v2pMap_.insert(std::make_pair(virtReg, physReg));
+ assert(inserted && "attempting to assign a virt->phys mapping to an "
+ "already mapped register");
+ prt_.addPhysRegUse(physReg);
+ return it;
}
-void RA::clearVirtReg(unsigned virtReg)
+void RA::clearVirtReg(Virt2PhysMap::iterator it)
{
- Virt2PhysMap::iterator it = v2pMap_.find(virtReg);
assert(it != v2pMap_.end() &&
"attempting to clear a not allocated virtual register");
unsigned physReg = it->second;
- markPhysRegFree(physReg);
- v2pMap_[virtReg] = 0; // this marks that this virtual register
- // lives on the stack
+ v2pMap_.erase(it);
DEBUG(std::cerr << "\t\t\tcleared register " << mri_->getName(physReg)
<< "\n");
}
-void RA::assignVirt2StackSlot(unsigned virtReg)
+
+int RA::assignVirt2StackSlot(unsigned virtReg)
{
const TargetRegisterClass* rc = mf_->getSSARegMap()->getRegClass(virtReg);
int frameIndex = mf_->getFrameInfo()->CreateStackObject(rc);
bool inserted = v2ssMap_.insert(std::make_pair(virtReg, frameIndex)).second;
- assert(inserted &&
- "attempt to assign stack slot to already assigned register?");
- // if the virtual register was previously assigned clear the mapping
- // and free the virtual register
- if (v2pMap_.find(virtReg) != v2pMap_.end()) {
- clearVirtReg(virtReg);
- }
- else {
- v2pMap_[virtReg] = 0; // this marks that this virtual register
- // lives on the stack
- }
+ assert(inserted && "attempt to assign stack slot to spilled register!");
+ return frameIndex;
}
int RA::getStackSlot(unsigned virtReg)
{
- // use lower_bound so that we can do a possibly O(1) insert later
- // if necessary
- Virt2StackSlotMap::iterator it = v2ssMap_.find(virtReg);
- assert(it != v2ssMap_.end() &&
- "attempt to get stack slot on register that does not live on the stack");
- return it->second;
-}
-
-void RA::spillVirtReg(unsigned virtReg)
-{
- DEBUG(std::cerr << "\t\t\tspilling register: " << virtReg);
- const TargetRegisterClass* rc = mf_->getSSARegMap()->getRegClass(virtReg);
- int frameIndex = getStackSlot(virtReg);
- DEBUG(std::cerr << " to stack slot #" << frameIndex << '\n');
- ++numSpilled;
- instrAdded_ += mri_->storeRegToStackSlot(*currentMbb_, currentInstr_,
- v2pMap_[virtReg], frameIndex, rc);
- clearVirtReg(virtReg);
-}
-
-void RA::loadVirt2PhysReg(unsigned virtReg, unsigned physReg)
-{
- DEBUG(std::cerr << "\t\t\tloading register: " << virtReg);
- const TargetRegisterClass* rc = mf_->getSSARegMap()->getRegClass(virtReg);
- int frameIndex = getStackSlot(virtReg);
- DEBUG(std::cerr << " from stack slot #" << frameIndex << '\n');
- ++numReloaded;
- instrAdded_ += mri_->loadRegFromStackSlot(*currentMbb_, currentInstr_,
- physReg, frameIndex, rc);
- assignVirt2PhysReg(virtReg, physReg);
-}
-
-void RA::markPhysRegFree(unsigned physReg)
-{
- assert(regUse_[physReg] != 0);
- --regUse_[physReg];
- for (const unsigned* as = mri_->getAliasSet(physReg); *as; ++as) {
- physReg = *as;
- assert(regUse_[physReg] != 0);
- --regUse_[physReg];
- }
-}
-
-void RA::markPhysRegNotFree(unsigned physReg)
-{
- ++regUse_[physReg];
- for (const unsigned* as = mri_->getAliasSet(physReg); *as; ++as) {
- physReg = *as;
- ++regUse_[physReg];
- }
+ assert(v2ssMap_.count(virtReg) &&
+ "attempt to get stack slot for a non spilled register");
+ return v2ssMap_.find(virtReg)->second;
}
FunctionPass* llvm::createLinearScanRegisterAllocator() {