ARM let processInstruction() tranforms chain.

[oota-llvm.git] / lib / Target / ARM / ARMFastISel.cpp
diff --git a/lib/Target/ARM/ARMFastISel.cpp b/lib/Target/ARM/ARMFastISel.cpp

index a315c305fca7270987c11ce09fb51c5aedcf1ad7..6b2c1f32d23447753fe63c9c454016bf7db5a545 100644 (file)
--- a/lib/Target/ARM/ARMFastISel.cpp
+++ b/lib/Target/ARM/ARMFastISel.cpp
@@ -90,7 +90,7 @@ class ARMFastISel : public FastISel {
    ARMFunctionInfo *AFI;
  
    // Convenience variables to avoid some queries.
-  bool isThumb;
+  bool isThumb2;
    LLVMContext *Context;
  
    public:
@@ -101,7 +101,7 @@ class ARMFastISel : public FastISel {
        TLI(*TM.getTargetLowering()) {
        Subtarget = &TM.getSubtarget<ARMSubtarget>();
        AFI = funcInfo.MF->getInfo<ARMFunctionInfo>();
-      isThumb = AFI->isThumbFunction();
+      isThumb2 = AFI->isThumbFunction();
        Context = &funcInfo.Fn->getContext();
      }
  
@@ -552,11 +552,12 @@ unsigned ARMFastISel::ARMMaterializeInt(const Constant *C, EVT VT) {
    // do so now.
    const ConstantInt *CI = cast<ConstantInt>(C);
    if (Subtarget->hasV6T2Ops() && isUInt<16>(CI->getZExtValue())) {
-    unsigned Opc = isThumb ? ARM::t2MOVi16 : ARM::MOVi16;
-    unsigned ImmReg = createResultReg(TLI.getRegClassFor(VT));
+    EVT SrcVT = MVT::i32;
+    unsigned Opc = isThumb2 ? ARM::t2MOVi16 : ARM::MOVi16;
+    unsigned ImmReg = createResultReg(TLI.getRegClassFor(SrcVT));
      AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                              TII.get(Opc), ImmReg)
-                    .addImm(CI->getSExtValue()));
+                    .addImm(CI->getZExtValue()));
      return ImmReg;
    }
  
@@ -574,7 +575,7 @@ unsigned ARMFastISel::ARMMaterializeInt(const Constant *C, EVT VT) {
    }
    unsigned Idx = MCP.getConstantPoolIndex(C, Align);
  
-  if (isThumb)
+  if (isThumb2)
      AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                              TII.get(ARM::t2LDRpci), DestReg)
                      .addConstantPoolIndex(Idx));
@@ -595,7 +596,7 @@ unsigned ARMFastISel::ARMMaterializeGV(const GlobalValue *GV, EVT VT) {
    Reloc::Model RelocM = TM.getRelocationModel();
  
    // TODO: Need more magic for ARM PIC.
-  if (!isThumb && (RelocM == Reloc::PIC_)) return 0;
+  if (!isThumb2 && (RelocM == Reloc::PIC_)) return 0;
  
    // MachineConstantPool wants an explicit alignment.
    unsigned Align = TD.getPrefTypeAlignment(GV->getType());
@@ -615,7 +616,7 @@ unsigned ARMFastISel::ARMMaterializeGV(const GlobalValue *GV, EVT VT) {
    // Load value.
    MachineInstrBuilder MIB;
    unsigned DestReg = createResultReg(TLI.getRegClassFor(VT));
-  if (isThumb) {
+  if (isThumb2) {
      unsigned Opc = (RelocM != Reloc::PIC_) ? ARM::t2LDRpci : ARM::t2LDRpci_pic;
      MIB = BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL, TII.get(Opc), DestReg)
            .addConstantPoolIndex(Idx);
@@ -632,7 +633,7 @@ unsigned ARMFastISel::ARMMaterializeGV(const GlobalValue *GV, EVT VT) {
  
    if (Subtarget->GVIsIndirectSymbol(GV, RelocM)) {
      unsigned NewDestReg = createResultReg(TLI.getRegClassFor(VT));
-    if (isThumb)
+    if (isThumb2)
        MIB = BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                      TII.get(ARM::t2LDRi12), NewDestReg)
              .addReg(DestReg)
@@ -680,7 +681,7 @@ unsigned ARMFastISel::TargetMaterializeAlloca(const AllocaInst *AI) {
    if (SI != FuncInfo.StaticAllocaMap.end()) {
      TargetRegisterClass* RC = TLI.getRegClassFor(VT);
      unsigned ResultReg = createResultReg(RC);
-    unsigned Opc = isThumb ? ARM::t2ADDri : ARM::ADDri;
+    unsigned Opc = isThumb2 ? ARM::t2ADDri : ARM::ADDri;
      AddOptionalDefs(BuildMI(*FuncInfo.MBB, *FuncInfo.InsertPt, DL,
                              TII.get(Opc), ResultReg)
                              .addFrameIndex(SI->second)
@@ -845,9 +846,18 @@ void ARMFastISel::ARMSimplifyAddress(Address &Addr, EVT VT) {
    switch (VT.getSimpleVT().SimpleTy) {
      default:
        assert(false && "Unhandled load/store type!");
+    case MVT::i16:
+      if (isThumb2)
+        // Integer loads/stores handle 12-bit offsets.
+        needsLowering = ((Addr.Offset & 0xfff) != Addr.Offset);
+      else
+        // ARM i16 integer loads/stores handle +/-imm8 offsets.
+        // FIXME: Negative offsets require special handling.
+        if (Addr.Offset > 255 || Addr.Offset < 0)
+          needsLowering = true;
+      break;
      case MVT::i1:
      case MVT::i8:
-    case MVT::i16:
      case MVT::i32:
        // Integer loads/stores handle 12-bit offsets.
        needsLowering = ((Addr.Offset & 0xfff) != Addr.Offset);
@@ -863,10 +873,10 @@ void ARMFastISel::ARMSimplifyAddress(Address &Addr, EVT VT) {
    // put the alloca address into a register, set the base type back to
    // register and continue. This should almost never happen.
    if (needsLowering && Addr.BaseType == Address::FrameIndexBase) {
-    TargetRegisterClass *RC = isThumb ? ARM::tGPRRegisterClass :
+    TargetRegisterClass *RC = isThumb2 ? ARM::tGPRRegisterClass :
                                ARM::GPRRegisterClass;
      unsigned ResultReg = createResultReg(RC);
-    unsigned Opc = isThumb ? ARM::t2ADDri : ARM::ADDri;
+    unsigned Opc = isThumb2 ? ARM::t2ADDri : ARM::ADDri;
      AddOptionalDefs(BuildMI(*FuncInfo.MBB, *FuncInfo.InsertPt, DL,
                              TII.get(Opc), ResultReg)
                              .addFrameIndex(Addr.Base.FI)
@@ -907,7 +917,7 @@ void ARMFastISel::AddLoadStoreOperands(EVT VT, Address &Addr,
      MIB.addFrameIndex(FI);
  
      // ARM halfword load/stores need an additional operand.
-    if (!isThumb && VT.getSimpleVT().SimpleTy == MVT::i16) MIB.addReg(0);
+    if (!isThumb2 && VT.getSimpleVT().SimpleTy == MVT::i16) MIB.addReg(0);
  
      MIB.addImm(Addr.Offset);
      MIB.addMemOperand(MMO);
@@ -916,7 +926,7 @@ void ARMFastISel::AddLoadStoreOperands(EVT VT, Address &Addr,
      MIB.addReg(Addr.Base.Reg);
  
      // ARM halfword load/stores need an additional operand.
-    if (!isThumb && VT.getSimpleVT().SimpleTy == MVT::i16) MIB.addReg(0);
+    if (!isThumb2 && VT.getSimpleVT().SimpleTy == MVT::i16) MIB.addReg(0);
  
      MIB.addImm(Addr.Offset);
    }
@@ -931,16 +941,16 @@ bool ARMFastISel::ARMEmitLoad(EVT VT, unsigned &ResultReg, Address &Addr) {
    switch (VT.getSimpleVT().SimpleTy) {
      // This is mostly going to be Neon/vector support.
      default: return false;
-    case MVT::i16:
-      Opc = isThumb ? ARM::t2LDRHi12 : ARM::LDRH;
+    case MVT::i8:
+      Opc = isThumb2 ? ARM::t2LDRBi12 : ARM::LDRBi12;
        RC = ARM::GPRRegisterClass;
        break;
-    case MVT::i8:
-      Opc = isThumb ? ARM::t2LDRBi12 : ARM::LDRBi12;
+    case MVT::i16:
+      Opc = isThumb2 ? ARM::t2LDRHi12 : ARM::LDRH;
        RC = ARM::GPRRegisterClass;
        break;
      case MVT::i32:
-      Opc = isThumb ? ARM::t2LDRi12 : ARM::LDRi12;
+      Opc = isThumb2 ? ARM::t2LDRi12 : ARM::LDRi12;
        RC = ARM::GPRRegisterClass;
        break;
      case MVT::f32:
@@ -989,22 +999,22 @@ bool ARMFastISel::ARMEmitStore(EVT VT, unsigned SrcReg, Address &Addr) {
      // This is mostly going to be Neon/vector support.
      default: return false;
      case MVT::i1: {
-      unsigned Res = createResultReg(isThumb ? ARM::tGPRRegisterClass :
+      unsigned Res = createResultReg(isThumb2 ? ARM::tGPRRegisterClass :
                                                 ARM::GPRRegisterClass);
-      unsigned Opc = isThumb ? ARM::t2ANDri : ARM::ANDri;
+      unsigned Opc = isThumb2 ? ARM::t2ANDri : ARM::ANDri;
        AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                                TII.get(Opc), Res)
                        .addReg(SrcReg).addImm(1));
        SrcReg = Res;
      } // Fallthrough here.
      case MVT::i8:
-      StrOpc = isThumb ? ARM::t2STRBi12 : ARM::STRBi12;
+      StrOpc = isThumb2 ? ARM::t2STRBi12 : ARM::STRBi12;
        break;
      case MVT::i16:
-      StrOpc = isThumb ? ARM::t2STRHi12 : ARM::STRH;
+      StrOpc = isThumb2 ? ARM::t2STRHi12 : ARM::STRH;
        break;
      case MVT::i32:
-      StrOpc = isThumb ? ARM::t2STRi12 : ARM::STRi12;
+      StrOpc = isThumb2 ? ARM::t2STRi12 : ARM::STRi12;
        break;
      case MVT::f32:
        if (!Subtarget->hasVFP2()) return false;
@@ -1128,7 +1138,7 @@ bool ARMFastISel::SelectBranch(const Instruction *I) {
        if (!ARMEmitCmp(CI->getOperand(0), CI->getOperand(1), CI->isUnsigned()))
          return false;
  
-      unsigned BrOpc = isThumb ? ARM::t2Bcc : ARM::Bcc;
+      unsigned BrOpc = isThumb2 ? ARM::t2Bcc : ARM::Bcc;
        BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL, TII.get(BrOpc))
        .addMBB(TBB).addImm(ARMPred).addReg(ARM::CPSR);
        FastEmitBranch(FBB, DL);
@@ -1139,7 +1149,7 @@ bool ARMFastISel::SelectBranch(const Instruction *I) {
      MVT SourceVT;
      if (TI->hasOneUse() && TI->getParent() == I->getParent() &&
          (isLoadTypeLegal(TI->getOperand(0)->getType(), SourceVT))) {
-      unsigned TstOpc = isThumb ? ARM::t2TSTri : ARM::TSTri;
+      unsigned TstOpc = isThumb2 ? ARM::t2TSTri : ARM::TSTri;
        unsigned OpReg = getRegForValue(TI->getOperand(0));
        AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                                TII.get(TstOpc))
@@ -1151,7 +1161,7 @@ bool ARMFastISel::SelectBranch(const Instruction *I) {
          CCMode = ARMCC::EQ;
        }
  
-      unsigned BrOpc = isThumb ? ARM::t2Bcc : ARM::Bcc;
+      unsigned BrOpc = isThumb2 ? ARM::t2Bcc : ARM::Bcc;
        BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL, TII.get(BrOpc))
        .addMBB(TBB).addImm(CCMode).addReg(ARM::CPSR);
  
@@ -1177,7 +1187,7 @@ bool ARMFastISel::SelectBranch(const Instruction *I) {
    // Regardless, the compare has been done in the predecessor block,
    // and it left a value for us in a virtual register.  Ergo, we test
    // the one-bit value left in the virtual register.
-  unsigned TstOpc = isThumb ? ARM::t2TSTri : ARM::TSTri;
+  unsigned TstOpc = isThumb2 ? ARM::t2TSTri : ARM::TSTri;
    AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL, TII.get(TstOpc))
                    .addReg(CmpReg).addImm(1));
  
@@ -1187,7 +1197,7 @@ bool ARMFastISel::SelectBranch(const Instruction *I) {
      CCMode = ARMCC::EQ;
    }
  
-  unsigned BrOpc = isThumb ? ARM::t2Bcc : ARM::Bcc;
+  unsigned BrOpc = isThumb2 ? ARM::t2Bcc : ARM::Bcc;
    BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL, TII.get(BrOpc))
                    .addMBB(TBB).addImm(CCMode).addReg(ARM::CPSR);
    FastEmitBranch(FBB, DL);
@@ -1205,16 +1215,42 @@ bool ARMFastISel::ARMEmitCmp(const Value *Src1Value, const Value *Src2Value,
    if (isFloat && !Subtarget->hasVFP2())
      return false;
  
+  // Check to see if the 2nd operand is a constant that we can encode directly
+  // in the compare.
+  int EncodedImm = 0;
+  bool EncodeImm = false;
+  bool isNegativeImm = false;
+  if (const ConstantInt *ConstInt = dyn_cast<ConstantInt>(Src2Value)) {
+    if (SrcVT == MVT::i32 || SrcVT == MVT::i16 || SrcVT == MVT::i8 ||
+        SrcVT == MVT::i1) {
+      const APInt &CIVal = ConstInt->getValue();
+      EncodedImm = (isZExt) ? (int)CIVal.getZExtValue() : (int)CIVal.getSExtValue();
+      if (EncodedImm < 0) {
+        isNegativeImm = true;
+        EncodedImm = -EncodedImm;
+      }
+      EncodeImm = isThumb2 ? (ARM_AM::getT2SOImmVal(EncodedImm) != -1) :
+        (ARM_AM::getSOImmVal(EncodedImm) != -1);
+    }
+  } else if (const ConstantFP *ConstFP = dyn_cast<ConstantFP>(Src2Value)) {
+    if (SrcVT == MVT::f32 || SrcVT == MVT::f64)
+      if (ConstFP->isZero() && !ConstFP->isNegative())
+        EncodeImm = true;
+  }
+
    unsigned CmpOpc;
+  bool isICmp = true;
    bool needsExt = false;
    switch (SrcVT.getSimpleVT().SimpleTy) {
      default: return false;
      // TODO: Verify compares.
      case MVT::f32:
-      CmpOpc = ARM::VCMPES;
+      isICmp = false;
+      CmpOpc = EncodeImm ? ARM::VCMPEZS : ARM::VCMPES;
        break;
      case MVT::f64:
-      CmpOpc = ARM::VCMPED;
+      isICmp = false;
+      CmpOpc = EncodeImm ? ARM::VCMPEZD : ARM::VCMPED;
        break;
      case MVT::i1:
      case MVT::i8:
@@ -1222,30 +1258,56 @@ bool ARMFastISel::ARMEmitCmp(const Value *Src1Value, const Value *Src2Value,
        needsExt = true;
      // Intentional fall-through.
      case MVT::i32:
-      CmpOpc = isThumb ? ARM::t2CMPrr : ARM::CMPrr;
+      if (isThumb2) {
+        if (!EncodeImm)
+          CmpOpc = ARM::t2CMPrr;
+        else
+          CmpOpc = isNegativeImm ? ARM::t2CMNzri : ARM::t2CMPri;
+      } else {
+        if (!EncodeImm)
+          CmpOpc = ARM::CMPrr;
+        else
+          CmpOpc = isNegativeImm ? ARM::CMNzri : ARM::CMPri;
+      }
        break;
    }
  
    unsigned SrcReg1 = getRegForValue(Src1Value);
    if (SrcReg1 == 0) return false;
  
-  unsigned SrcReg2 = getRegForValue(Src2Value);
-  if (SrcReg2 == 0) return false;
+  unsigned SrcReg2;
+  if (!EncodeImm) {
+    SrcReg2 = getRegForValue(Src2Value);
+    if (SrcReg2 == 0) return false;
+  }
  
    // We have i1, i8, or i16, we need to either zero extend or sign extend.
    if (needsExt) {
      unsigned ResultReg;
-    EVT DestVT = MVT::i32;
-    ResultReg = ARMEmitIntExt(SrcVT, SrcReg1, DestVT, isZExt);
+    ResultReg = ARMEmitIntExt(SrcVT, SrcReg1, MVT::i32, isZExt);
      if (ResultReg == 0) return false;
      SrcReg1 = ResultReg;
-    ResultReg = ARMEmitIntExt(SrcVT, SrcReg2, DestVT, isZExt);
-    if (ResultReg == 0) return false;
-    SrcReg2 = ResultReg;
+    if (!EncodeImm) {
+      ResultReg = ARMEmitIntExt(SrcVT, SrcReg2, MVT::i32, isZExt);
+      if (ResultReg == 0) return false;
+      SrcReg2 = ResultReg;
+    }
    }
  
-  AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL, TII.get(CmpOpc))
-                  .addReg(SrcReg1).addReg(SrcReg2));
+  if (!EncodeImm) {
+    AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
+                            TII.get(CmpOpc))
+                    .addReg(SrcReg1).addReg(SrcReg2));
+  } else {
+    MachineInstrBuilder MIB;
+    MIB = BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL, TII.get(CmpOpc))
+      .addReg(SrcReg1);
+
+    // Only add immediate for icmp as the immediate for fcmp is an implicit 0.0.
+    if (isICmp)
+      MIB.addImm(EncodedImm);
+    AddOptionalDefs(MIB);
+  }
  
    // For floating point we need to move the result to a comparison register
    // that we can then use for branches.
@@ -1271,8 +1333,8 @@ bool ARMFastISel::SelectCmp(const Instruction *I) {
  
    // Now set a register based on the comparison. Explicitly set the predicates
    // here.
-  unsigned MovCCOpc = isThumb ? ARM::t2MOVCCi : ARM::MOVCCi;
-  TargetRegisterClass *RC = isThumb ? ARM::rGPRRegisterClass
+  unsigned MovCCOpc = isThumb2 ? ARM::t2MOVCCi : ARM::MOVCCi;
+  TargetRegisterClass *RC = isThumb2 ? ARM::rGPRRegisterClass
                                      : ARM::GPRRegisterClass;
    unsigned DestReg = createResultReg(RC);
    Constant *Zero = ConstantInt::get(Type::getInt32Ty(*Context), 0);
@@ -1417,11 +1479,11 @@ bool ARMFastISel::SelectSelect(const Instruction *I) {
    unsigned Op2Reg = getRegForValue(I->getOperand(2));
    if (Op2Reg == 0) return false;
  
-  unsigned CmpOpc = isThumb ? ARM::t2TSTri : ARM::TSTri;
+  unsigned CmpOpc = isThumb2 ? ARM::t2TSTri : ARM::TSTri;
    AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL, TII.get(CmpOpc))
                    .addReg(CondReg).addImm(1));
    unsigned ResultReg = createResultReg(RC);
-  unsigned MovCCOpc = isThumb ? ARM::t2MOVCCr : ARM::MOVCCr;
+  unsigned MovCCOpc = isThumb2 ? ARM::t2MOVCCr : ARM::MOVCCr;
    BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL, TII.get(MovCCOpc), ResultReg)
      .addReg(Op1Reg).addReg(Op2Reg)
      .addImm(ARMCC::EQ).addReg(ARM::CPSR);
@@ -1598,33 +1660,21 @@ bool ARMFastISel::ProcessCallArgs(SmallVectorImpl<Value*> &Args,
      switch (VA.getLocInfo()) {
        case CCValAssign::Full: break;
        case CCValAssign::SExt: {
-        bool Emitted = FastEmitExtend(ISD::SIGN_EXTEND, VA.getLocVT(),
-                                         Arg, ArgVT, Arg);
-        assert(Emitted && "Failed to emit a sext!"); (void)Emitted;
-        Emitted = true;
-        ArgVT = VA.getLocVT();
+        EVT DestVT = VA.getLocVT();
+        unsigned ResultReg = ARMEmitIntExt(ArgVT, Arg, DestVT,
+                                           /*isZExt*/false);
+        assert (ResultReg != 0 && "Failed to emit a sext");
+        Arg = ResultReg;
          break;
        }
+      case CCValAssign::AExt:
+        // Intentional fall-through.  Handle AExt and ZExt.
        case CCValAssign::ZExt: {
-        bool Emitted = FastEmitExtend(ISD::ZERO_EXTEND, VA.getLocVT(),
-                                         Arg, ArgVT, Arg);
-        assert(Emitted && "Failed to emit a zext!"); (void)Emitted;
-        Emitted = true;
-        ArgVT = VA.getLocVT();
-        break;
-      }
-      case CCValAssign::AExt: {
-        bool Emitted = FastEmitExtend(ISD::ANY_EXTEND, VA.getLocVT(),
-                                         Arg, ArgVT, Arg);
-        if (!Emitted)
-          Emitted = FastEmitExtend(ISD::ZERO_EXTEND, VA.getLocVT(),
-                                      Arg, ArgVT, Arg);
-        if (!Emitted)
-          Emitted = FastEmitExtend(ISD::SIGN_EXTEND, VA.getLocVT(),
-                                      Arg, ArgVT, Arg);
-
-        assert(Emitted && "Failed to emit a aext!"); (void)Emitted;
-        ArgVT = VA.getLocVT();
+        EVT DestVT = VA.getLocVT();
+        unsigned ResultReg = ARMEmitIntExt(ArgVT, Arg, DestVT,
+                                           /*isZExt*/true);
+        assert (ResultReg != 0 && "Failed to emit a sext");
+        Arg = ResultReg;
          break;
        }
        case CCValAssign::BCvt: {
@@ -1642,7 +1692,7 @@ bool ARMFastISel::ProcessCallArgs(SmallVectorImpl<Value*> &Args,
      if (VA.isRegLoc() && !VA.needsCustom()) {
        BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL, TII.get(TargetOpcode::COPY),
                VA.getLocReg())
-      .addReg(Arg);
+        .addReg(Arg);
        RegArgs.push_back(VA.getLocReg());
      } else if (VA.needsCustom()) {
        // TODO: We need custom lowering for vector (v2f64) args.
@@ -1708,6 +1758,11 @@ bool ARMFastISel::FinishCall(MVT RetVT, SmallVectorImpl<unsigned> &UsedRegs,
      } else {
        assert(RVLocs.size() == 1 &&"Can't handle non-double multi-reg retvals!");
        EVT CopyVT = RVLocs[0].getValVT();
+
+      // Special handling for extended integers.
+      if (RetVT == MVT::i1 || RetVT == MVT::i8 || RetVT == MVT::i16)
+        CopyVT = MVT::i32;
+
        TargetRegisterClass* DstRC = TLI.getRegClassFor(CopyVT);
  
        unsigned ResultReg = createResultReg(DstRC);
@@ -1794,7 +1849,7 @@ bool ARMFastISel::SelectRet(const Instruction *I) {
      MRI.addLiveOut(VA.getLocReg());
    }
  
-  unsigned RetOpc = isThumb ? ARM::tBX_RET : ARM::BX_RET;
+  unsigned RetOpc = isThumb2 ? ARM::tBX_RET : ARM::BX_RET;
    AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                            TII.get(RetOpc)));
    return true;
@@ -1804,7 +1859,7 @@ unsigned ARMFastISel::ARMSelectCallOp(const GlobalValue *GV) {
  
    // Darwin needs the r9 versions of the opcodes.
    bool isDarwin = Subtarget->isTargetDarwin();
-  if (isThumb) {
+  if (isThumb2) {
      return isDarwin ? ARM::tBLr9 : ARM::tBL;
    } else  {
      return isDarwin ? ARM::BLr9 : ARM::BL;
@@ -1870,7 +1925,7 @@ bool ARMFastISel::ARMEmitLibcall(const Instruction *I, RTLIB::Libcall Call) {
    // TODO: Turn this into the table of arm call ops.
    MachineInstrBuilder MIB;
    unsigned CallOpc = ARMSelectCallOp(NULL);
-  if(isThumb)
+  if(isThumb2)
      // Explicitly adding the predicate here.
      MIB = AddDefaultPred(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                           TII.get(CallOpc)))
@@ -1924,7 +1979,8 @@ bool ARMFastISel::SelectCall(const Instruction *I) {
    MVT RetVT;
    if (RetTy->isVoidTy())
      RetVT = MVT::isVoid;
-  else if (!isTypeLegal(RetTy, RetVT))
+  else if (!isTypeLegal(RetTy, RetVT) && RetVT != MVT::i16 &&
+           RetVT != MVT::i8  && RetVT != MVT::i1)
      return false;
  
    // TODO: For now if we have long calls specified we don't handle the call.
@@ -1961,8 +2017,8 @@ bool ARMFastISel::SelectCall(const Instruction *I) {
  
      Type *ArgTy = (*i)->getType();
      MVT ArgVT;
-    // FIXME: Should be able to handle i1, i8, and/or i16 parameters.
-    if (!isTypeLegal(ArgTy, ArgVT))
+    if (!isTypeLegal(ArgTy, ArgVT) && ArgVT != MVT::i16 && ArgVT != MVT::i8 &&
+        ArgVT != MVT::i1)
        return false;
      unsigned OriginalAlignment = TD.getABITypeAlignment(ArgTy);
      Flags.setOrigAlign(OriginalAlignment);
@@ -1984,7 +2040,7 @@ bool ARMFastISel::SelectCall(const Instruction *I) {
    MachineInstrBuilder MIB;
    unsigned CallOpc = ARMSelectCallOp(GV);
    // Explicitly adding the predicate here.
-  if(isThumb)
+  if(isThumb2)
      // Explicitly adding the predicate here.
      MIB = AddDefaultPred(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                           TII.get(CallOpc)))
@@ -2045,20 +2101,20 @@ unsigned ARMFastISel::ARMEmitIntExt(EVT SrcVT, unsigned SrcReg, EVT DestVT,
    case MVT::i16:
      if (!Subtarget->hasV6Ops()) return 0;
      if (isZExt)
-      Opc = isThumb ? ARM::t2UXTH : ARM::UXTH;
+      Opc = isThumb2 ? ARM::t2UXTH : ARM::UXTH;
      else
-      Opc = isThumb ? ARM::t2SXTH : ARM::SXTH;
+      Opc = isThumb2 ? ARM::t2SXTH : ARM::SXTH;
      break;
    case MVT::i8:
      if (!Subtarget->hasV6Ops()) return 0;
      if (isZExt)
-      Opc = isThumb ? ARM::t2UXTB : ARM::UXTB;
+      Opc = isThumb2 ? ARM::t2UXTB : ARM::UXTB;
      else
-      Opc = isThumb ? ARM::t2SXTB : ARM::SXTB;
+      Opc = isThumb2 ? ARM::t2SXTB : ARM::SXTB;
      break;
    case MVT::i1:
      if (isZExt) {
-      Opc = isThumb ? ARM::t2ANDri : ARM::ANDri;
+      Opc = isThumb2 ? ARM::t2ANDri : ARM::ANDri;
        isBoolZext = true;
        break;
      }