ARM64: diagnose use of v16-v31 in certain indexed NEON instructions.

[oota-llvm.git] / lib / Target / ARM64 / ARM64ISelLowering.cpp
diff --git a/lib/Target/ARM64/ARM64ISelLowering.cpp b/lib/Target/ARM64/ARM64ISelLowering.cpp

index 58e425938e137c9a01c2743fd3d2451460096a77..024bc7416885f7dfeb7dfd3428ff4eb2dda3e3cd 100644 (file)
--- a/lib/Target/ARM64/ARM64ISelLowering.cpp
+++ b/lib/Target/ARM64/ARM64ISelLowering.cpp
@@ -370,8 +370,6 @@ ARM64TargetLowering::ARM64TargetLowering(ARM64TargetMachine &TM)
  
    setMinFunctionAlignment(2);
  
-  setDivIsWellDefined(true);
-
    RequireStrictAlign = StrictAlign;
  
    setHasExtractBitsInsn(true);
@@ -437,6 +435,11 @@ ARM64TargetLowering::ARM64TargetLowering(ARM64TargetMachine &TM)
        setOperationAction(ISD::SIGN_EXTEND_INREG, (MVT::SimpleValueType)VT,
                           Expand);
  
+      setOperationAction(ISD::MULHS, (MVT::SimpleValueType)VT, Expand);
+      setOperationAction(ISD::SMUL_LOHI, (MVT::SimpleValueType)VT, Expand);
+      setOperationAction(ISD::MULHU, (MVT::SimpleValueType)VT, Expand);
+      setOperationAction(ISD::UMUL_LOHI, (MVT::SimpleValueType)VT, Expand);
+
        for (unsigned InnerVT = (unsigned)MVT::FIRST_VECTOR_VALUETYPE;
             InnerVT <= (unsigned)MVT::LAST_VECTOR_VALUETYPE; ++InnerVT)
          setTruncStoreAction((MVT::SimpleValueType)VT,
@@ -619,7 +622,7 @@ ARM64TargetLowering::createFastISel(FunctionLoweringInfo &funcInfo,
  const char *ARM64TargetLowering::getTargetNodeName(unsigned Opcode) const {
    switch (Opcode) {
    default:
-    return 0;
+    return nullptr;
    case ARM64ISD::CALL:              return "ARM64ISD::CALL";
    case ARM64ISD::ADRP:              return "ARM64ISD::ADRP";
    case ARM64ISD::ADDlow:            return "ARM64ISD::ADDlow";
@@ -1418,8 +1421,7 @@ static SDValue LowerVectorINT_TO_FP(SDValue Op, SelectionDAG &DAG) {
      BuildVectorOps.push_back(Sclr);
    }
  
-  return DAG.getNode(ISD::BUILD_VECTOR, dl, VT, &BuildVectorOps[0],
-                     BuildVectorOps.size());
+  return DAG.getNode(ISD::BUILD_VECTOR, dl, VT, BuildVectorOps);
  }
  
  SDValue ARM64TargetLowering::LowerINT_TO_FP(SDValue Op,
@@ -1818,8 +1820,7 @@ void ARM64TargetLowering::saveVarArgRegisters(CCState &CCInfo,
    }
  
    if (!MemOps.empty()) {
-    Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, &MemOps[0],
-                        MemOps.size());
+    Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, MemOps);
    }
  }
  
@@ -2106,8 +2107,7 @@ SDValue ARM64TargetLowering::LowerCall(CallLoweringInfo &CLI,
    }
  
    if (!MemOpChains.empty())
-    Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, &MemOpChains[0],
-                        MemOpChains.size());
+    Chain = DAG.getNode(ISD::TokenFactor, DL, MVT::Other, MemOpChains);
  
    // Build a sequence of copy-to-reg nodes chained together with token chain
    // and flag operands which copy the outgoing args into the appropriate regs.
@@ -2183,10 +2183,10 @@ SDValue ARM64TargetLowering::LowerCall(CallLoweringInfo &CLI,
    // If we're doing a tall call, use a TC_RETURN here rather than an
    // actual call instruction.
    if (IsTailCall)
-    return DAG.getNode(ARM64ISD::TC_RETURN, DL, NodeTys, &Ops[0], Ops.size());
+    return DAG.getNode(ARM64ISD::TC_RETURN, DL, NodeTys, Ops);
  
    // Returns a chain and a flag for retval copy to use.
-  Chain = DAG.getNode(ARM64ISD::CALL, DL, NodeTys, &Ops[0], Ops.size());
+  Chain = DAG.getNode(ARM64ISD::CALL, DL, NodeTys, Ops);
    InFlag = Chain.getValue(1);
  
    Chain = DAG.getCALLSEQ_END(Chain, DAG.getIntPtrConstant(NumBytes, true),
@@ -2254,8 +2254,7 @@ ARM64TargetLowering::LowerReturn(SDValue Chain, CallingConv::ID CallConv,
    if (Flag.getNode())
      RetOps.push_back(Flag);
  
-  return DAG.getNode(ARM64ISD::RET_FLAG, DL, MVT::Other, &RetOps[0],
-                     RetOps.size());
+  return DAG.getNode(ARM64ISD::RET_FLAG, DL, MVT::Other, RetOps);
  }
  
  //===----------------------------------------------------------------------===//
@@ -2425,7 +2424,7 @@ SDValue ARM64TargetLowering::LowerELFTLSDescCall(SDValue SymAddr,
    Ops.push_back(Glue);
  
    SDVTList NodeTys = DAG.getVTList(MVT::Other, MVT::Glue);
-  Chain = DAG.getNode(ARM64ISD::TLSDESC_CALL, DL, NodeTys, &Ops[0], Ops.size());
+  Chain = DAG.getNode(ARM64ISD::TLSDESC_CALL, DL, NodeTys, Ops);
    Glue = Chain.getValue(1);
  
    return DAG.getCopyFromReg(Chain, DL, ARM64::X0, PtrVT, Glue);
@@ -2565,7 +2564,7 @@ SDValue ARM64TargetLowering::LowerBR_CC(SDValue Op, SelectionDAG &DAG) const {
  
      // If softenSetCCOperands returned a scalar, we need to compare the result
      // against zero to select between true and false values.
-    if (RHS.getNode() == 0) {
+    if (!RHS.getNode()) {
        RHS = DAG.getConstant(0, LHS.getValueType());
        CC = ISD::SETNE;
      }
@@ -2735,8 +2734,7 @@ SDValue ARM64TargetLowering::LowerFCOPYSIGN(SDValue Op,
    for (unsigned i = 0; i < VecVT.getVectorNumElements(); ++i)
      BuildVectorOps.push_back(EltMask);
  
-  SDValue BuildVec = DAG.getNode(ISD::BUILD_VECTOR, DL, VecVT,
-                                 &BuildVectorOps[0], BuildVectorOps.size());
+  SDValue BuildVec = DAG.getNode(ISD::BUILD_VECTOR, DL, VecVT, BuildVectorOps);
  
    // If we couldn't materialize the mask above, then the mask vector will be
    // the zero vector, and we need to negate it here.
@@ -2815,7 +2813,7 @@ SDValue ARM64TargetLowering::LowerSETCC(SDValue Op, SelectionDAG &DAG) const {
      softenSetCCOperands(DAG, MVT::f128, LHS, RHS, CC, dl);
  
      // If softenSetCCOperands returned a scalar, use it.
-    if (RHS.getNode() == 0) {
+    if (!RHS.getNode()) {
        assert(LHS.getValueType() == Op.getValueType() &&
               "Unexpected setcc expansion!");
        return LHS;
@@ -2939,7 +2937,7 @@ SDValue ARM64TargetLowering::LowerSELECT_CC(SDValue Op,
  
      // If softenSetCCOperands returned a scalar, we need to compare the result
      // against zero to select between true and false values.
-    if (RHS.getNode() == 0) {
+    if (!RHS.getNode()) {
        RHS = DAG.getConstant(0, LHS.getValueType());
        CC = ISD::SETNE;
      }
@@ -3273,8 +3271,7 @@ SDValue ARM64TargetLowering::LowerAAPCS_VASTART(SDValue Op,
                                  VROffsAddr, MachinePointerInfo(SV, 28), false,
                                  false, 4));
  
-  return DAG.getNode(ISD::TokenFactor, DL, MVT::Other, &MemOps[0],
-                     MemOps.size());
+  return DAG.getNode(ISD::TokenFactor, DL, MVT::Other, MemOps);
  }
  
  SDValue ARM64TargetLowering::LowerVASTART(SDValue Op, SelectionDAG &DAG) const {
@@ -3350,7 +3347,7 @@ SDValue ARM64TargetLowering::LowerVAARG(SDValue Op, SelectionDAG &DAG) const {
                                     DAG.getIntPtrConstant(1));
      SDValue Ops[] = { NarrowFP, WideFP.getValue(1) };
      // Merge the rounded value with the chain output of the load.
-    return DAG.getMergeValues(Ops, 2, DL);
+    return DAG.getMergeValues(Ops, DL);
    }
  
    return DAG.getLoad(VT, DL, APStore, VAList, MachinePointerInfo(), false,
@@ -3437,7 +3434,7 @@ SDValue ARM64TargetLowering::LowerShiftRightParts(SDValue Op,
        DAG.getNode(ARM64ISD::CSEL, dl, VT, TrueValHi, FalseValHi, CCVal, Cmp);
  
    SDValue Ops[2] = { Lo, Hi };
-  return DAG.getMergeValues(Ops, 2, dl);
+  return DAG.getMergeValues(Ops, dl);
  }
  
  /// LowerShiftLeftParts - Lower SHL_PARTS, which returns two
@@ -3477,7 +3474,7 @@ SDValue ARM64TargetLowering::LowerShiftLeftParts(SDValue Op,
        DAG.getNode(ARM64ISD::CSEL, dl, VT, TrueValLo, FalseValLo, CCVal, Cmp);
  
    SDValue Ops[2] = { Lo, Hi };
-  return DAG.getMergeValues(Ops, 2, dl);
+  return DAG.getMergeValues(Ops, dl);
  }
  
  bool
@@ -3563,7 +3560,7 @@ ARM64TargetLowering::getSingleConstraintMatchWeight(
    Value *CallOperandVal = info.CallOperandVal;
    // If we don't have a value, we can't do a match,
    // but allow it at the lowest weight.
-  if (CallOperandVal == NULL)
+  if (!CallOperandVal)
      return CW_Default;
    Type *type = CallOperandVal->getType();
    // Look at the constraint type.
@@ -3617,7 +3614,7 @@ ARM64TargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint,
    Res = TargetLowering::getRegForInlineAsmConstraint(Constraint, VT);
  
    // Not found as a standard register?
-  if (Res.second == 0) {
+  if (!Res.second) {
      unsigned Size = Constraint.size();
      if ((Size == 4 || Size == 5) && Constraint[0] == '{' &&
          tolower(Constraint[1]) == 'v' && Constraint[Size - 1] == '}') {
@@ -3642,7 +3639,7 @@ ARM64TargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint,
  void ARM64TargetLowering::LowerAsmOperandForConstraint(
      SDValue Op, std::string &Constraint, std::vector<SDValue> &Ops,
      SelectionDAG &DAG) const {
-  SDValue Result(0, 0);
+  SDValue Result;
  
    // Currently only support length 1 constraints.
    if (Constraint.length() != 1)
@@ -4359,14 +4356,16 @@ static SDValue GenerateTBL(SDValue Op, ArrayRef<int> ShuffleMask,
      Shuffle = DAG.getNode(
          ISD::INTRINSIC_WO_CHAIN, DL, IndexVT,
          DAG.getConstant(Intrinsic::arm64_neon_tbl1, MVT::i32), V1Cst,
-        DAG.getNode(ISD::BUILD_VECTOR, DL, IndexVT, &TBLMask[0], IndexLen));
+        DAG.getNode(ISD::BUILD_VECTOR, DL, IndexVT,
+                    ArrayRef<SDValue>(TBLMask.data(), IndexLen)));
    } else {
      if (IndexLen == 8) {
        V1Cst = DAG.getNode(ISD::CONCAT_VECTORS, DL, MVT::v16i8, V1Cst, V2Cst);
        Shuffle = DAG.getNode(
            ISD::INTRINSIC_WO_CHAIN, DL, IndexVT,
            DAG.getConstant(Intrinsic::arm64_neon_tbl1, MVT::i32), V1Cst,
-          DAG.getNode(ISD::BUILD_VECTOR, DL, IndexVT, &TBLMask[0], IndexLen));
+          DAG.getNode(ISD::BUILD_VECTOR, DL, IndexVT,
+                      ArrayRef<SDValue>(TBLMask.data(), IndexLen)));
      } else {
        // FIXME: We cannot, for the moment, emit a TBL2 instruction because we
        // cannot currently represent the register constraints on the input
@@ -4377,7 +4376,8 @@ static SDValue GenerateTBL(SDValue Op, ArrayRef<int> ShuffleMask,
        Shuffle = DAG.getNode(
            ISD::INTRINSIC_WO_CHAIN, DL, IndexVT,
            DAG.getConstant(Intrinsic::arm64_neon_tbl2, MVT::i32), V1Cst, V2Cst,
-          DAG.getNode(ISD::BUILD_VECTOR, DL, IndexVT, &TBLMask[0], IndexLen));
+          DAG.getNode(ISD::BUILD_VECTOR, DL, IndexVT,
+                      ArrayRef<SDValue>(TBLMask.data(), IndexLen)));
      }
    }
    return DAG.getNode(ISD::BITCAST, DL, Op.getValueType(), Shuffle);
@@ -5160,7 +5160,7 @@ FailedModImm:
        for (unsigned i = 0; i < NumElts; ++i)
          Ops.push_back(DAG.getNode(ISD::BITCAST, dl, NewType, Op.getOperand(i)));
        EVT VecVT = EVT::getVectorVT(*DAG.getContext(), NewType, NumElts);
-      SDValue Val = DAG.getNode(ISD::BUILD_VECTOR, dl, VecVT, &Ops[0], NumElts);
+      SDValue Val = DAG.getNode(ISD::BUILD_VECTOR, dl, VecVT, Ops);
        Val = LowerBUILD_VECTOR(Val, DAG);
        if (Val.getNode())
          return DAG.getNode(ISD::BITCAST, dl, VT, Val);
@@ -5812,12 +5812,12 @@ EVT ARM64TargetLowering::getOptimalMemOpType(uint64_t Size, unsigned DstAlign,
    // addressing mode). Just do two i64 store of zero-registers.
    bool Fast;
    const Function *F = MF.getFunction();
-  if (!IsMemset && Size >= 16 &&
+  if (Subtarget->hasFPARMv8() && !IsMemset && Size >= 16 &&
        !F->getAttributes().hasAttribute(AttributeSet::FunctionIndex,
                                         Attribute::NoImplicitFloat) &&
        (memOpAlign(SrcAlign, DstAlign, 16) ||
-       (allowsUnalignedMemoryAccesses(MVT::v2i64, 0, &Fast) && Fast)))
-    return MVT::v2i64;
+       (allowsUnalignedMemoryAccesses(MVT::f128, 0, &Fast) && Fast)))
+    return MVT::f128;
  
    return Size >= 8 ? MVT::i64 : MVT::i32;
  }