Use an enum instead of magic constants to improve readability.

[oota-llvm.git] / lib / Target / X86 / X86InstrInfo.cpp
diff --git a/lib/Target/X86/X86InstrInfo.cpp b/lib/Target/X86/X86InstrInfo.cpp

index f3ec067bdb328ef99116c8f541328fac3facd69b..7ba542c87520ff96fa03e8a61dda82585a5a7242 100644 (file)
--- a/lib/Target/X86/X86InstrInfo.cpp
+++ b/lib/Target/X86/X86InstrInfo.cpp
@@ -24,8 +24,8 @@
  #include "llvm/CodeGen/MachineFrameInfo.h"
  #include "llvm/CodeGen/MachineInstrBuilder.h"
  #include "llvm/CodeGen/MachineRegisterInfo.h"
-#include "llvm/DerivedTypes.h"
-#include "llvm/LLVMContext.h"
+#include "llvm/IR/DerivedTypes.h"
+#include "llvm/IR/LLVMContext.h"
  #include "llvm/MC/MCAsmInfo.h"
  #include "llvm/MC/MCInst.h"
  #include "llvm/Support/CommandLine.h"
@@ -467,9 +467,7 @@ X86InstrInfo::X86InstrInfo(X86TargetMachine &tm)
      { X86::RSQRTSSr,        X86::RSQRTSSm,            0 },
      { X86::RSQRTSSr_Int,    X86::RSQRTSSm_Int,        0 },
      { X86::SQRTPDr,         X86::SQRTPDm,             TB_ALIGN_16 },
-    { X86::SQRTPDr_Int,     X86::SQRTPDm_Int,         TB_ALIGN_16 },
      { X86::SQRTPSr,         X86::SQRTPSm,             TB_ALIGN_16 },
-    { X86::SQRTPSr_Int,     X86::SQRTPSm_Int,         TB_ALIGN_16 },
      { X86::SQRTSDr,         X86::SQRTSDm,             0 },
      { X86::SQRTSDr_Int,     X86::SQRTSDm_Int,         0 },
      { X86::SQRTSSr,         X86::SQRTSSm,             0 },
@@ -528,9 +526,7 @@ X86InstrInfo::X86InstrInfo(X86TargetMachine &tm)
      { X86::VRSQRTPSr,       X86::VRSQRTPSm,           0 },
      { X86::VRSQRTPSr_Int,   X86::VRSQRTPSm_Int,       0 },
      { X86::VSQRTPDr,        X86::VSQRTPDm,            0 },
-    { X86::VSQRTPDr_Int,    X86::VSQRTPDm_Int,        0 },
      { X86::VSQRTPSr,        X86::VSQRTPSm,            0 },
-    { X86::VSQRTPSr_Int,    X86::VSQRTPSm_Int,        0 },
      { X86::VUCOMISDrr,      X86::VUCOMISDrm,          0 },
      { X86::VUCOMISSrr,      X86::VUCOMISSrm,          0 },
      { X86::VBROADCASTSSrr,  X86::VBROADCASTSSrm,      TB_NO_REVERSE },
@@ -554,11 +550,8 @@ X86InstrInfo::X86InstrInfo(X86TargetMachine &tm)
      { X86::VRCPPSYr,        X86::VRCPPSYm,            0 },
      { X86::VRCPPSYr_Int,    X86::VRCPPSYm_Int,        0 },
      { X86::VRSQRTPSYr,      X86::VRSQRTPSYm,          0 },
-    { X86::VRSQRTPSYr_Int,  X86::VRSQRTPSYm_Int,      0 },
      { X86::VSQRTPDYr,       X86::VSQRTPDYm,           0 },
-    { X86::VSQRTPDYr_Int,   X86::VSQRTPDYm_Int,       0 },
      { X86::VSQRTPSYr,       X86::VSQRTPSYm,           0 },
-    { X86::VSQRTPSYr_Int,   X86::VSQRTPSYm_Int,       0 },
      { X86::VBROADCASTSSYrr, X86::VBROADCASTSSYrm,     TB_NO_REVERSE },
      { X86::VBROADCASTSDYrr, X86::VBROADCASTSDYrm,     TB_NO_REVERSE },
  
@@ -3662,7 +3655,16 @@ X86InstrInfo::foldMemoryOperandImpl(MachineFunction &MF,
                                      const SmallVectorImpl<MachineOperand> &MOs,
                                      unsigned Size, unsigned Align) const {
    const DenseMap<unsigned, std::pair<unsigned,unsigned> > *OpcodeTablePtr = 0;
+  bool isCallRegIndirect = TM.getSubtarget<X86Subtarget>().callRegIndirect();
    bool isTwoAddrFold = false;
+
+  // Atom favors the register form of call, so when the subtarget prefers
+  // register-indirect calls we do not fold loads into CALL32r/CALL64r.
+  if (isCallRegIndirect &&
+    (MI->getOpcode() == X86::CALL32r || MI->getOpcode() == X86::CALL64r)) {
+    return NULL;
+  }
+
    unsigned NumOps = MI->getDesc().getNumOperands();
    bool isTwoAddr = NumOps > 1 &&
      MI->getDesc().getOperandConstraint(1, MCOI::TIED_TO) != -1;
@@ -3871,8 +3873,8 @@ MachineInstr* X86InstrInfo::foldMemoryOperandImpl(MachineFunction &MF,
  
    // Unless optimizing for size, don't fold to avoid partial
    // register update stalls
-  if (!MF.getFunction()->getFnAttributes().
-        hasAttribute(Attribute::OptimizeForSize) &&
+  if (!MF.getFunction()->getAttributes().
+        hasAttribute(AttributeSet::FunctionIndex, Attribute::OptimizeForSize) &&
        hasPartialRegUpdate(MI->getOpcode()))
      return 0;
  
@@ -3913,8 +3915,8 @@ MachineInstr* X86InstrInfo::foldMemoryOperandImpl(MachineFunction &MF,
  
    // Unless optimizing for size, don't fold to avoid partial
    // register update stalls
-  if (!MF.getFunction()->getFnAttributes().
-        hasAttribute(Attribute::OptimizeForSize) &&
+  if (!MF.getFunction()->getAttributes().
+        hasAttribute(AttributeSet::FunctionIndex, Attribute::OptimizeForSize) &&
        hasPartialRegUpdate(MI->getOpcode()))
      return 0;
  
@@ -4670,13 +4672,9 @@ bool X86InstrInfo::isHighLatencyDef(int opc) const {
    case X86::DIVSSrr:
    case X86::DIVSSrr_Int:
    case X86::SQRTPDm:
-  case X86::SQRTPDm_Int:
    case X86::SQRTPDr:
-  case X86::SQRTPDr_Int:
    case X86::SQRTPSm:
-  case X86::SQRTPSm_Int:
    case X86::SQRTPSr:
-  case X86::SQRTPSr_Int:
    case X86::SQRTSDm:
    case X86::SQRTSDm_Int:
    case X86::SQRTSDr:
@@ -4695,13 +4693,9 @@ bool X86InstrInfo::isHighLatencyDef(int opc) const {
    case X86::VDIVSSrr:
    case X86::VDIVSSrr_Int:
    case X86::VSQRTPDm:
-  case X86::VSQRTPDm_Int:
    case X86::VSQRTPDr:
-  case X86::VSQRTPDr_Int:
    case X86::VSQRTPSm:
-  case X86::VSQRTPSm_Int:
    case X86::VSQRTPSr:
-  case X86::VSQRTPSr_Int:
    case X86::VSQRTSDm:
    case X86::VSQRTSDm_Int:
    case X86::VSQRTSDr: