Do not create calls via PLT in compilation callback - this is higly platform

[oota-llvm.git] / lib / Target / X86 / X86InstrInfo.cpp
diff --git a/lib/Target/X86/X86InstrInfo.cpp b/lib/Target/X86/X86InstrInfo.cpp

index 22f8b53e32883d9d4f0becd45cb8c5ea9c4497d4..1a7f06cbe3a1dec3fce76727464aca63e82a5b52 100644 (file)
--- a/lib/Target/X86/X86InstrInfo.cpp
+++ b/lib/Target/X86/X86InstrInfo.cpp
@@ -31,23 +31,21 @@
  #include "llvm/Support/ErrorHandling.h"
  #include "llvm/Support/raw_ostream.h"
  #include "llvm/Target/TargetOptions.h"
-#include "llvm/Target/TargetAsmInfo.h"
+#include "llvm/MC/MCAsmInfo.h"
  using namespace llvm;
  
-namespace {
-  cl::opt<bool>
-  NoFusing("disable-spill-fusing",
-           cl::desc("Disable fusing of spill code into instructions"));
-  cl::opt<bool>
-  PrintFailedFusing("print-failed-fuse-candidates",
-                    cl::desc("Print instructions that the allocator wants to"
-                             " fuse, but the X86 backend currently can't"),
-                    cl::Hidden);
-  cl::opt<bool>
-  ReMatPICStubLoad("remat-pic-stub-load",
-                   cl::desc("Re-materialize load from stub in PIC mode"),
-                   cl::init(false), cl::Hidden);
-}
+static cl::opt<bool>
+NoFusing("disable-spill-fusing",
+         cl::desc("Disable fusing of spill code into instructions"));
+static cl::opt<bool>
+PrintFailedFusing("print-failed-fuse-candidates",
+                  cl::desc("Print instructions that the allocator wants to"
+                           " fuse, but the X86 backend currently can't"),
+                  cl::Hidden);
+static cl::opt<bool>
+ReMatPICStubLoad("remat-pic-stub-load",
+                 cl::desc("Re-materialize load from stub in PIC mode"),
+                 cl::init(false), cl::Hidden);
  
  X86InstrInfo::X86InstrInfo(X86TargetMachine &tm)
    : TargetInstrInfoImpl(X86Insts, array_lengthof(X86Insts)),
@@ -1697,10 +1695,14 @@ bool X86InstrInfo::copyRegToReg(MachineBasicBlock &MBB,
      CommonRC = SrcRC;
    else if (!DestRC->hasSubClass(SrcRC)) {
      // Neither of GR64_NOREX or GR64_NOSP is a superclass of the other,
-    // but we want to copy then as GR64.
+    // but we want to copy then as GR64. Similarly, for GR32_NOREX and
+    // GR32_NOSP, copy as GR32.
      if (SrcRC->hasSuperClass(&X86::GR64RegClass) &&
          DestRC->hasSuperClass(&X86::GR64RegClass))
        CommonRC = &X86::GR64RegClass;
+    else if (SrcRC->hasSuperClass(&X86::GR32RegClass) &&
+             DestRC->hasSuperClass(&X86::GR32RegClass))
+      CommonRC = &X86::GR32RegClass;
      else
        CommonRC = 0;
    }
@@ -2033,6 +2035,7 @@ bool X86InstrInfo::spillCalleeSavedRegisters(MachineBasicBlock &MBB,
    if (MI != MBB.end()) DL = MI->getDebugLoc();
  
    bool is64Bit = TM.getSubtarget<X86Subtarget>().is64Bit();
+  bool isWin64 = TM.getSubtarget<X86Subtarget>().isTargetWin64();
    unsigned SlotSize = is64Bit ? 8 : 4;
  
    MachineFunction &MF = *MBB.getParent();
@@ -2049,7 +2052,7 @@ bool X86InstrInfo::spillCalleeSavedRegisters(MachineBasicBlock &MBB,
      if (Reg == FPReg)
        // X86RegisterInfo::emitPrologue will handle spilling of frame register.
        continue;
-    if (RegClass != &X86::VR128RegClass) {
+    if (RegClass != &X86::VR128RegClass && !isWin64) {
        CalleeFrameSize += SlotSize;
        BuildMI(MBB, MI, DL, get(Opc)).addReg(Reg, RegState::Kill);
      } else {
@@ -2073,6 +2076,7 @@ bool X86InstrInfo::restoreCalleeSavedRegisters(MachineBasicBlock &MBB,
    MachineFunction &MF = *MBB.getParent();
    unsigned FPReg = RI.getFrameRegister(MF);
    bool is64Bit = TM.getSubtarget<X86Subtarget>().is64Bit();
+  bool isWin64 = TM.getSubtarget<X86Subtarget>().isTargetWin64();
    unsigned Opc = is64Bit ? X86::POP64r : X86::POP32r;
    for (unsigned i = 0, e = CSI.size(); i != e; ++i) {
      unsigned Reg = CSI[i].getReg();
@@ -2080,7 +2084,7 @@ bool X86InstrInfo::restoreCalleeSavedRegisters(MachineBasicBlock &MBB,
        // X86RegisterInfo::emitEpilogue will handle restoring of frame register.
        continue;
      const TargetRegisterClass *RegClass = CSI[i].getRegClass();
-    if (RegClass != &X86::VR128RegClass) {
+    if (RegClass != &X86::VR128RegClass && !isWin64) {
        BuildMI(MBB, MI, DL, get(Opc), Reg);
      } else {
        loadRegFromStackSlot(MBB, MI, Reg, CSI[i].getFrameIdx(), RegClass);
@@ -2211,7 +2215,7 @@ X86InstrInfo::foldMemoryOperandImpl(MachineFunction &MF,
    
    // No fusion 
    if (PrintFailedFusing)
-    cerr << "We failed to fuse operand " << i << " in " << *MI;
+    errs() << "We failed to fuse operand " << i << " in " << *MI;
    return NULL;
  }
  
@@ -2295,7 +2299,8 @@ MachineInstr* X86InstrInfo::foldMemoryOperandImpl(MachineFunction &MF,
  
      // Create a v4i32 constant-pool entry.
      MachineConstantPool &MCP = *MF.getConstantPool();
-    const VectorType *Ty = VectorType::get(Type::Int32Ty, 4);
+    const VectorType *Ty =
+          VectorType::get(Type::getInt32Ty(MF.getFunction()->getContext()), 4);
      Constant *C = LoadMI->getOpcode() == X86::V_SET0 ?
                      Constant::getNullValue(Ty) :
                      Constant::getAllOnesValue(Ty);
@@ -2517,7 +2522,7 @@ X86InstrInfo::unfoldMemoryOperand(SelectionDAG &DAG, SDNode *N,
    SDNode *Load = 0;
    const MachineFunction &MF = DAG.getMachineFunction();
    if (FoldedLoad) {
-    MVT VT = *RC->vt_begin();
+    EVT VT = *RC->vt_begin();
      bool isAligned = (RI.getStackAlignment() >= 16) ||
        RI.needsStackRealignment(MF);
      Load = DAG.getTargetNode(getLoadRegOpcode(0, RC, isAligned, TM), dl,
@@ -2526,14 +2531,14 @@ X86InstrInfo::unfoldMemoryOperand(SelectionDAG &DAG, SDNode *N,
    }
  
    // Emit the data processing instruction.
-  std::vector<MVT> VTs;
+  std::vector<EVT> VTs;
    const TargetRegisterClass *DstRC = 0;
    if (TID.getNumDefs() > 0) {
      DstRC = TID.OpInfo[0].getRegClass(&RI);
      VTs.push_back(*DstRC->vt_begin());
    }
    for (unsigned i = 0, e = N->getNumValues(); i != e; ++i) {
-    MVT VT = N->getValueType(i);
+    EVT VT = N->getValueType(i);
      if (VT != MVT::Other && i >= (unsigned)TID.getNumDefs())
        VTs.push_back(VT);
    }
@@ -2923,6 +2928,10 @@ static unsigned GetInstSizeWithDesc(const MachineInstr &MI,
    case X86II::TA:  // 0F 3A
      Need0FPrefix = true;
      break;
+  case X86II::TF: // F2 0F 38
+    ++FinalSize;
+    Need0FPrefix = true;
+    break;
    case X86II::REP: break; // already handled.
    case X86II::XS:   // F3 0F
      ++FinalSize;
@@ -2958,6 +2967,9 @@ static unsigned GetInstSizeWithDesc(const MachineInstr &MI,
    case X86II::TA:  // 0F 3A
      ++FinalSize;
      break;
+  case X86II::TF: // F2 0F 38
+    ++FinalSize;
+    break;
    }
  
    // If this is a two-address instruction, skip one of the register operands.
@@ -2981,14 +2993,13 @@ static unsigned GetInstSizeWithDesc(const MachineInstr &MI,
        const MachineFunction *MF = MI.getParent()->getParent();
        const TargetInstrInfo &TII = *MF->getTarget().getInstrInfo();
        FinalSize += TII.getInlineAsmLength(MI.getOperand(0).getSymbolName(),
-                                          *MF->getTarget().getTargetAsmInfo());
+                                          *MF->getTarget().getMCAsmInfo());
        break;
      }
      case TargetInstrInfo::DBG_LABEL:
      case TargetInstrInfo::EH_LABEL:
        break;
      case TargetInstrInfo::IMPLICIT_DEF:
-    case TargetInstrInfo::DECLARE:
      case X86::DWARF_LOC:
      case X86::FP_REG_KILL:
        break;
@@ -3226,7 +3237,7 @@ unsigned X86InstrInfo::getGlobalBaseReg(MachineFunction *MF) const {
      GlobalBaseReg = RegInfo.createVirtualRegister(X86::GR32RegisterClass);
      // Generate addl $__GLOBAL_OFFSET_TABLE_ + [.-piclabel], %some_register
      BuildMI(FirstMBB, MBBI, DL, TII->get(X86::ADD32ri), GlobalBaseReg)
-      .addReg(PC).addExternalSymbol("_GLOBAL_OFFSET_TABLE_", 0,
+      .addReg(PC).addExternalSymbol("_GLOBAL_OFFSET_TABLE_",
                                      X86II::MO_GOT_ABSOLUTE_ADDRESS);
    } else {
      GlobalBaseReg = PC;