// series of EXTRACT_VECTOR_ELT nodes are generated, one for each element in
// the vector. If all are expanded here, we don't want one store per vector
// element.
+
+ // Caches for hasPredecessorHelper
+ SmallPtrSet<const SDNode *, 32> Visited;
+ SmallVector<const SDNode *, 16> Worklist;
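+  // Note: Visited and Worklist are deliberately declared outside the use
+  // loop below and shared across hasPredecessorHelper calls. The helper only
+  // ever expands predecessors of Idx, so nodes already visited while testing
+  // one candidate store do not need to be re-walked for the next.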
+
SDValue StackPtr, Ch;
for (SDNode::use_iterator UI = Vec.getNode()->use_begin(),
UE = Vec.getNode()->use_end(); UI != UE; ++UI) {
    SDNode *User = *UI;
    if (StoreSDNode *ST = dyn_cast<StoreSDNode>(User)) {
      // Make sure that nothing else could have stored into the destination
      // of this store.
      if (!ST->getChain().reachesChainWithoutSideEffects(DAG.getEntryNode()))
        continue;
+      // If the index is dependent on the store, we will introduce a cycle
+      // when creating the load (the load uses the index, and by replacing
+      // the chain we will make the index dependent on the load).
+ if (Idx.getNode()->hasPredecessorHelper(ST, Visited, Worklist))
+ continue;
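+
+      // Hypothetical sketch of the cycle being avoided here (node names are
+      // invented for illustration):
+      //   ST:      ch     = store Ch0, Vec, <slot>
+      //   Idx:     i32,ch = load ST, %i          ; index chained after ST
+      //   NewLoad: f32,ch = load ST, <slot + Idx>
+      // NewLoad's address uses Idx, and replacing ST's chain uses with
+      // NewLoad would make Idx's chain depend on NewLoad -- a cycle.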
+
StackPtr = ST->getBasePtr();
Ch = SDValue(ST, 0);
break;
--- /dev/null
+; RUN: llc < %s -mtriple=x86_64-unknown-unknown | FileCheck %s
+
+; When the extractelement is converted to a load, the store can be re-used.
+; This would, however, introduce a cycle into the selection DAG (the load
+; of the extractelement index is dependent on the store, and so after the
+; conversion it becomes dependent on the new load, which is dependent on
+; the index). Make sure we skip the store and conservatively use a fresh
+; store to the stack instead.
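+; (In the IR below, the index load %2 is chained after the store of %mul,
+; which is precisely the dependence that would close the cycle.)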
+
+define float @foo(i32* %i, <4 x float>* %v) {
+; CHECK-LABEL: foo:
+; CHECK: movaps %xmm0, -[[OFFSET:[0-9]+]](%rsp)
+; CHECK: movss -[[OFFSET]](%rsp,{{.*}}), %xmm0
+; CHECK-NEXT: retq
+ %1 = load <4 x float>, <4 x float>* %v, align 16
+ %mul = fmul <4 x float> %1, %1
+ store <4 x float> %mul, <4 x float>* %v, align 16
+ %2 = load i32, i32* %i, align 4
+ %vecext = extractelement <4 x float> %mul, i32 %2
+ ret float %vecext
+}