[ARM] Prevent PerformVDIVCombine from combining a vcvt/vdiv with 8 lanes.

author Chad Rosier <mcrosier@codeaurora.org>

Wed, 7 Oct 2015 16:15:40 +0000 (16:15 +0000)

committer Chad Rosier <mcrosier@codeaurora.org>

Wed, 7 Oct 2015 16:15:40 +0000 (16:15 +0000)
author Chad Rosier <mcrosier@codeaurora.org>
Wed, 7 Oct 2015 16:15:40 +0000 (16:15 +0000)
committer Chad Rosier <mcrosier@codeaurora.org>
Wed, 7 Oct 2015 16:15:40 +0000 (16:15 +0000)
diff --git a/lib/Target/ARM/ARMISelLowering.cpp b/lib/Target/ARM/ARMISelLowering.cpp

index 6f886220bd26adfb606760753b3cdcf67f955a4c..cafb4500d1a406d486e489089011cb45af2f2593 100644 (file)
--- a/lib/Target/ARM/ARMISelLowering.cpp
+++ b/lib/Target/ARM/ARMISelLowering.cpp
@@ -9908,10 +9908,12 @@ static SDValue PerformVDIVCombine(SDNode *N, SelectionDAG &DAG,
    uint32_t FloatBits = FloatTy.getSizeInBits();
    MVT IntTy = Op.getOperand(0).getSimpleValueType().getVectorElementType();
    uint32_t IntBits = IntTy.getSizeInBits();
-  if (FloatBits != 32 || IntBits > 32) {
+  unsigned NumLanes = Op.getValueType().getVectorNumElements();
+  if (FloatBits != 32 || IntBits > 32 || NumLanes > 4) {
      // These instructions only exist converting from i32 to f32. We can handle
      // smaller integers by generating an extra extend, but larger ones would
-    // be lossy.
+    // be lossy. We also can't handle more then 4 lanes, since these intructions
+    // only support v2i32/v4i32 types.
      return SDValue();
    }
  
@@ -9922,7 +9924,6 @@ static SDValue PerformVDIVCombine(SDNode *N, SelectionDAG &DAG,
  
    SDLoc dl(N);
    SDValue ConvInput = Op.getOperand(0);
-  unsigned NumLanes = Op.getValueType().getVectorNumElements();
    if (IntBits < FloatBits)
      ConvInput = DAG.getNode(isSigned ? ISD::SIGN_EXTEND : ISD::ZERO_EXTEND,
                              dl, NumLanes == 2 ? MVT::v2i32 : MVT::v4i32,
diff --git a/test/CodeGen/ARM/vdiv_combine.ll b/test/CodeGen/ARM/vdiv_combine.ll

index 8c6e4ba350549a6b97c3db1f9d76a717e830dd9f..dbbf92efd22b1b82c39b152ad7356fe2c261c55f 100644 (file)
--- a/test/CodeGen/ARM/vdiv_combine.ll
+++ b/test/CodeGen/ARM/vdiv_combine.ll
@@ -136,3 +136,11 @@ define <2 x double> @fix_i64_to_double(<2 x i64> %in) {
      ret <2 x double> %shift
  }
  
+; Don't combine with 8 lanes.  Just make sure things don't crash.
+; CHECK-LABEL: test7
+define <8 x float> @test7(<8 x i32> %in) nounwind {
+entry:
+  %vcvt.i = sitofp <8 x i32> %in to <8 x float>
+  %div.i = fdiv <8 x float> %vcvt.i, <float 8.0, float 8.0, float 8.0, float 8.0, float 8.0, float 8.0, float 8.0, float 8.0>
+  ret <8 x float> %div.i
+}
author	Chad Rosier <mcrosier@codeaurora.org>
	Wed, 7 Oct 2015 16:15:40 +0000 (16:15 +0000)
committer	Chad Rosier <mcrosier@codeaurora.org>
	Wed, 7 Oct 2015 16:15:40 +0000 (16:15 +0000)
lib/Target/ARM/ARMISelLowering.cpp		patch \| blob \| history
test/CodeGen/ARM/vdiv_combine.ll		patch \| blob \| history