[X86] Generate .cfi_adjust_cfa_offset correctly when pushing arguments

[oota-llvm.git] / lib / Target / X86 / X86TargetMachine.cpp
diff --git a/lib/Target/X86/X86TargetMachine.cpp b/lib/Target/X86/X86TargetMachine.cpp

index 11f6fd17ec651c8920446d1f45db8289d095b9d6..2e869eb7c3cd6eaf34b0d2b68d8cbae06f5ecab0 100644 (file)
--- a/lib/Target/X86/X86TargetMachine.cpp
+++ b/lib/Target/X86/X86TargetMachine.cpp
@@ -14,19 +14,31 @@
  #include "X86TargetMachine.h"
  #include "X86.h"
  #include "X86TargetObjectFile.h"
+#include "X86TargetTransformInfo.h"
  #include "llvm/CodeGen/Passes.h"
  #include "llvm/IR/Function.h"
-#include "llvm/PassManager.h"
+#include "llvm/IR/LegacyPassManager.h"
  #include "llvm/Support/CommandLine.h"
  #include "llvm/Support/FormattedStream.h"
  #include "llvm/Support/TargetRegistry.h"
  #include "llvm/Target/TargetOptions.h"
  using namespace llvm;
  
+static cl::opt<bool> EnableMachineCombinerPass("x86-machine-combiner",
+                               cl::desc("Enable the machine combiner pass"),
+                               cl::init(true), cl::Hidden);
+
+namespace llvm {
+void initializeWinEHStatePassPass(PassRegistry &);
+}
+
  extern "C" void LLVMInitializeX86Target() {
    // Register the target.
    RegisterTargetMachine<X86TargetMachine> X(TheX86_32Target);
    RegisterTargetMachine<X86TargetMachine> Y(TheX86_64Target);
+
+  PassRegistry &PR = *PassRegistry::getPassRegistry();
+  initializeWinEHStatePassPass(PR);
  }
  
  static std::unique_ptr<TargetLoweringObjectFile> createTLOF(const Triple &TT) {
@@ -36,11 +48,11 @@ static std::unique_ptr<TargetLoweringObjectFile> createTLOF(const Triple &TT) {
      return make_unique<TargetLoweringObjectFileMachO>();
    }
  
-  if (TT.isOSLinux())
-    return make_unique<X86LinuxTargetObjectFile>();
+  if (TT.isOSLinux() || TT.isOSNaCl())
+    return make_unique<X86LinuxNaClTargetObjectFile>();
    if (TT.isOSBinFormatELF())
-    return make_unique<TargetLoweringObjectFileELF>();
-  if (TT.isKnownWindowsMSVCEnvironment())
+    return make_unique<X86ELFTargetObjectFile>();
+  if (TT.isKnownWindowsMSVCEnvironment() || TT.isWindowsCoreCLREnvironment())
      return make_unique<X86WindowsTargetObjectFile>();
    if (TT.isOSBinFormatCOFF())
      return make_unique<TargetLoweringObjectFileCOFF>();
@@ -80,7 +92,7 @@ static std::string computeDataLayout(const Triple &TT) {
  
    // The stack is aligned to 32 bits on some ABIs and 128 bits on others.
    if (!TT.isArch64Bit() && TT.isOSWindows())
-    Ret += "-S32";
+    Ret += "-a:0:32-S32";
    else
      Ret += "-S128";
  
@@ -89,18 +101,15 @@ static std::string computeDataLayout(const Triple &TT) {
  
  /// X86TargetMachine ctor - Create an X86 target.
  ///
-X86TargetMachine::X86TargetMachine(const Target &T, StringRef TT, StringRef CPU,
-                                   StringRef FS, const TargetOptions &Options,
+X86TargetMachine::X86TargetMachine(const Target &T, const Triple &TT,
+                                   StringRef CPU, StringRef FS,
+                                   const TargetOptions &Options,
                                     Reloc::Model RM, CodeModel::Model CM,
                                     CodeGenOpt::Level OL)
-    : LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL),
-      TLOF(createTLOF(Triple(getTargetTriple()))),
-      DL(computeDataLayout(Triple(TT))),
+    : LLVMTargetMachine(T, computeDataLayout(TT), TT, CPU, FS, Options, RM, CM,
+                        OL),
+      TLOF(createTLOF(getTargetTriple())),
        Subtarget(TT, CPU, FS, *this, Options.StackAlignmentOverride) {
-  // default to hard float ABI
-  if (Options.FloatABIType == FloatABI::Default)
-    this->Options.FloatABIType = FloatABI::Hard;
-
    // Windows stack unwinder gets confused when execution flow "falls through"
    // after a call to 'noreturn' function.
    // To prevent that, we emit a trap for 'unreachable' IR instructions.
@@ -108,6 +117,16 @@ X86TargetMachine::X86TargetMachine(const Target &T, StringRef TT, StringRef CPU,
    if (Subtarget.isTargetWin64())
      this->Options.TrapUnreachable = true;
  
+  // By default (and when -ffast-math is on), enable estimate codegen for
+  // everything except scalar division. By default, use 1 refinement step for
+  // all operations. Defaults may be overridden by using command-line options.
+  // Scalar division estimates are disabled because they break too much
+  // real-world code. These defaults match GCC behavior.
+  this->Options.Reciprocals.setDefaults("sqrtf", true, 1);
+  this->Options.Reciprocals.setDefaults("divf", false, 1);
+  this->Options.Reciprocals.setDefaults("vec-sqrtf", true, 1);
+  this->Options.Reciprocals.setDefaults("vec-divf", true, 1);
+
    initAsmInfo();
  }
  
@@ -115,11 +134,8 @@ X86TargetMachine::~X86TargetMachine() {}
  
  const X86Subtarget *
  X86TargetMachine::getSubtargetImpl(const Function &F) const {
-  AttributeSet FnAttrs = F.getAttributes();
-  Attribute CPUAttr =
-      FnAttrs.getAttribute(AttributeSet::FunctionIndex, "target-cpu");
-  Attribute FSAttr =
-      FnAttrs.getAttribute(AttributeSet::FunctionIndex, "target-features");
+  Attribute CPUAttr = F.getFnAttribute("target-cpu");
+  Attribute FSAttr = F.getFnAttribute("target-features");
  
    std::string CPU = !CPUAttr.hasAttribute(Attribute::None)
                          ? CPUAttr.getValueAsString().str()
@@ -133,14 +149,15 @@ X86TargetMachine::getSubtargetImpl(const Function &F) const {
    // function before we can generate a subtarget. We also need to use
    // it as a key for the subtarget since that can be the only difference
    // between two functions.
-  Attribute SFAttr =
-      FnAttrs.getAttribute(AttributeSet::FunctionIndex, "use-soft-float");
-  bool SoftFloat = !SFAttr.hasAttribute(Attribute::None)
-                       ? SFAttr.getValueAsString() == "true"
-                       : Options.UseSoftFloat;
-
-  auto &I = SubtargetMap[CPU + FS + (SoftFloat ? "use-soft-float=true"
-                                               : "use-soft-float=false")];
+  bool SoftFloat =
+      F.hasFnAttribute("use-soft-float") &&
+      F.getFnAttribute("use-soft-float").getValueAsString() == "true";
+  // If the soft float attribute is set on the function turn on the soft float
+  // subtarget feature.
+  if (SoftFloat)
+    FS += FS.empty() ? "+soft-float" : ",+soft-float";
+
+  auto &I = SubtargetMap[CPU + FS];
    if (!I) {
      // This needs to be done before we create a new subtarget since any
      // creation will depend on the TM and the code generation flags on the
@@ -161,15 +178,13 @@ UseVZeroUpper("x86-use-vzeroupper", cl::Hidden,
    cl::init(true));
  
  //===----------------------------------------------------------------------===//
-// X86 Analysis Pass Setup
+// X86 TTI query.
  //===----------------------------------------------------------------------===//
  
-void X86TargetMachine::addAnalysisPasses(PassManagerBase &PM) {
-  // Add first the target-independent BasicTTI pass, then our X86 pass. This
-  // allows the X86 pass to delegate to the target independent layer when
-  // appropriate.
-  PM.add(createBasicTargetTransformInfoPass(this));
-  PM.add(createX86TargetTransformInfoPass(this));
+TargetIRAnalysis X86TargetMachine::getTargetIRAnalysis() {
+  return TargetIRAnalysis([this](const Function &F) {
+    return TargetTransformInfo(X86TTIImpl(this, F));
+  });
  }
  
  
@@ -188,15 +203,14 @@ public:
      return getTM<X86TargetMachine>();
    }
  
-  const X86Subtarget &getX86Subtarget() const {
-    return *getX86TargetMachine().getSubtargetImpl();
-  }
-
    void addIRPasses() override;
    bool addInstSelector() override;
    bool addILPOpts() override;
+  bool addPreISel() override;
+  void addPreRegAlloc() override;
    void addPostRegAlloc() override;
    void addPreEmitPass() override;
+  void addPreSched2() override;
  };
  } // namespace
  
@@ -215,7 +229,8 @@ bool X86PassConfig::addInstSelector() {
    addPass(createX86ISelDag(getX86TargetMachine(), getOptLevel()));
  
    // For ELF, cleanup any local-dynamic TLS accesses.
-  if (getX86Subtarget().isTargetELF() && getOptLevel() != CodeGenOpt::None)
+  if (TM->getTargetTriple().isOSBinFormatELF() &&
+      getOptLevel() != CodeGenOpt::None)
      addPass(createCleanupLocalDynamicTLSPass());
  
    addPass(createX86GlobalBaseRegPass());
@@ -225,15 +240,31 @@ bool X86PassConfig::addInstSelector() {
  
  bool X86PassConfig::addILPOpts() {
    addPass(&EarlyIfConverterID);
+  if (EnableMachineCombinerPass)
+    addPass(&MachineCombinerID);
+  return true;
+}
+
+bool X86PassConfig::addPreISel() {
+  // Only add this pass for 32-bit x86 Windows.
+  const Triple &TT = TM->getTargetTriple();
+  if (TT.isOSWindows() && TT.getArch() == Triple::x86)
+    addPass(createX86WinEHStatePass());
    return true;
  }
  
+void X86PassConfig::addPreRegAlloc() {
+  addPass(createX86CallFrameOptimization());
+}
+
  void X86PassConfig::addPostRegAlloc() {
    addPass(createX86FloatingPointStackifierPass());
  }
  
+void X86PassConfig::addPreSched2() { addPass(createX86ExpandPseudoPass()); }
+
  void X86PassConfig::addPreEmitPass() {
-  if (getOptLevel() != CodeGenOpt::None && getX86Subtarget().hasSSE2())
+  if (getOptLevel() != CodeGenOpt::None)
      addPass(createExecutionDependencyFixPass(&X86::VR128RegClass));
  
    if (UseVZeroUpper)