[CodeGen] Mark the promoted FCOPYSIGN result FP_ROUND as TRUNCating.

author Ahmed Bougacha <ahmed.bougacha@gmail.com>

Thu, 13 Aug 2015 01:32:30 +0000 (01:32 +0000)

committer Ahmed Bougacha <ahmed.bougacha@gmail.com>

Thu, 13 Aug 2015 01:32:30 +0000 (01:32 +0000)
author Ahmed Bougacha <ahmed.bougacha@gmail.com>
Thu, 13 Aug 2015 01:32:30 +0000 (01:32 +0000)
committer Ahmed Bougacha <ahmed.bougacha@gmail.com>
Thu, 13 Aug 2015 01:32:30 +0000 (01:32 +0000)
diff --git a/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp b/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp

index 3b15752e2e440f287f9ba7fae760e966d712f977..552f92bbd46de22ac2eb7b2640e7cbaa3e178471 100644 (file)
--- a/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp
+++ b/lib/CodeGen/SelectionDAG/LegalizeDAG.cpp
@@ -4301,8 +4301,15 @@ void SelectionDAGLegalize::PromoteNode(SDNode *Node) {
      Tmp1 = DAG.getNode(ISD::FP_EXTEND, dl, NVT, Node->getOperand(0));
      Tmp2 = Node->getOperand(1);
      Tmp3 = DAG.getNode(Node->getOpcode(), dl, NVT, Tmp1, Tmp2);
+
+    // fcopysign doesn't change anything but the sign bit, so
+    //   (fp_round (fcopysign (fpext a), b))
+    // is as precise as
+    //   (fp_round (fpext a))
+    // which is a no-op. Mark it as a TRUNCating FP_ROUND.
+    const bool isTrunc = (Node->getOpcode() == ISD::FCOPYSIGN);
      Results.push_back(DAG.getNode(ISD::FP_ROUND, dl, OVT,
-                                  Tmp3, DAG.getIntPtrConstant(0, dl)));
+                                  Tmp3, DAG.getIntPtrConstant(isTrunc, dl)));
      break;
    }
    case ISD::FFLOOR:
diff --git a/test/CodeGen/AArch64/f16-instructions.ll b/test/CodeGen/AArch64/f16-instructions.ll

index 99dc8e3301486b75d1333e1d023dad5e47d75093..3dd54e6462384e85123d2d07f623078e2f4474f1 100644 (file)
--- a/test/CodeGen/AArch64/f16-instructions.ll
+++ b/test/CodeGen/AArch64/f16-instructions.ll
@@ -702,6 +702,21 @@ define half @test_copysign_f64(half %a, double %b) #0 {
    ret half %r
  }
  
+; Check that the FP promotion will use a truncating FP_ROUND, so we can fold
+; away the (fpext (fp_round <result>)) here.
+
+; CHECK-LABEL: test_copysign_extended:
+; CHECK-NEXT: fcvt s1, h1
+; CHECK-NEXT: fcvt s0, h0
+; CHECK-NEXT: movi.4s v2, #0x80, lsl #24
+; CHECK-NEXT: bit.16b v0, v1, v2
+; CHECK-NEXT: ret
+define float @test_copysign_extended(half %a, half %b) #0 {
+  %r = call half @llvm.copysign.f16(half %a, half %b)
+  %xr = fpext half %r to float
+  ret float %xr
+}
+
  ; CHECK-LABEL: test_floor:
  ; CHECK-NEXT: fcvt [[FLOAT32:s[0-9]+]], h0
  ; CHECK-NEXT: frintm [[INT32:s[0-9]+]], [[FLOAT32]]
author	Ahmed Bougacha <ahmed.bougacha@gmail.com>
	Thu, 13 Aug 2015 01:32:30 +0000 (01:32 +0000)
committer	Ahmed Bougacha <ahmed.bougacha@gmail.com>
	Thu, 13 Aug 2015 01:32:30 +0000 (01:32 +0000)
lib/CodeGen/SelectionDAG/LegalizeDAG.cpp		patch | blob | history
test/CodeGen/AArch64/f16-instructions.ll		patch | blob | history