[AArch64][FastISel] Fix the setting of kill flags for MUL -> UMULH sequences.

[oota-llvm.git] / lib / Target / AArch64 / AArch64TargetTransformInfo.cpp
diff --git a/lib/Target/AArch64/AArch64TargetTransformInfo.cpp b/lib/Target/AArch64/AArch64TargetTransformInfo.cpp

index eab080bb24c38d1a44b377096ef99a6672167155..0533355b01dec0910c7469e3e0768e0919950d4b 100644 (file)
--- a/lib/Target/AArch64/AArch64TargetTransformInfo.cpp
+++ b/lib/Target/AArch64/AArch64TargetTransformInfo.cpp
@@ -10,6 +10,7 @@
  #include "AArch64TargetTransformInfo.h"
  #include "MCTargetDesc/AArch64AddressingModes.h"
  #include "llvm/Analysis/TargetTransformInfo.h"
+#include "llvm/Analysis/LoopInfo.h"
  #include "llvm/CodeGen/BasicTTIImpl.h"
  #include "llvm/Support/Debug.h"
  #include "llvm/Target/CostTable.h"
@@ -352,7 +353,7 @@ unsigned AArch64TTIImpl::getCmpSelInstrCost(unsigned Opcode, Type *ValTy,
    // We don't lower vector selects well that are wider than the register width.
    if (ValTy->isVectorTy() && ISD == ISD::SELECT) {
      // We would need this many instructions to hide the scalarization happening.
-    unsigned AmortizationCost = 20;
+    const unsigned AmortizationCost = 20;
      static const TypeConversionCostTblEntry<MVT::SimpleValueType>
      VectorSelectTbl[] = {
        { ISD::SELECT, MVT::v16i1, MVT::v16i16, 16 * AmortizationCost },
@@ -424,8 +425,17 @@ unsigned AArch64TTIImpl::getMaxInterleaveFactor() {
    return 2;
  }
  
-void AArch64TTIImpl::getUnrollingPreferences(const Function *F, Loop *L,
+void AArch64TTIImpl::getUnrollingPreferences(Loop *L,
                                               TTI::UnrollingPreferences &UP) {
+  // Enable partial unrolling and runtime unrolling.
+  BaseT::getUnrollingPreferences(L, UP);
+
+  // For inner loop, it is more likely to be a hot one, and the runtime check
+  // can be promoted out from LICM pass, so the overhead is less, let's try
+  // a larger threshold to unroll more loops.
+  if (L->getLoopDepth() > 1)
+    UP.PartialThreshold *= 2;
+
    // Disable partial & runtime unrolling on -Os.
    UP.PartialOptSizeThreshold = 0;
  }