Lower MEMBARRIER on x86 and support processors without SSE2.

author Eric Christopher <echristo@apple.com>

Wed, 21 Jul 2010 09:05:23 +0000 (09:05 +0000)

committer Eric Christopher <echristo@apple.com>

Wed, 21 Jul 2010 09:05:23 +0000 (09:05 +0000)
author Eric Christopher <echristo@apple.com>
Wed, 21 Jul 2010 09:05:23 +0000 (09:05 +0000)
committer Eric Christopher <echristo@apple.com>
Wed, 21 Jul 2010 09:05:23 +0000 (09:05 +0000)
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp

index d10f4ec2f92d0a6c783bad71a81065af1d73d368..67a15406d497a19996c5fc436f53c2e9068ecbf4 100644 (file)
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -343,8 +343,9 @@ X86TargetLowering::X86TargetLowering(X86TargetMachine &TM)
    if (Subtarget->hasSSE1())
      setOperationAction(ISD::PREFETCH      , MVT::Other, Legal);
  
-  if (!Subtarget->hasSSE2())
-    setOperationAction(ISD::MEMBARRIER    , MVT::Other, Expand);
+  // We may not have a libcall for MEMBARRIER so we should lower this.
+  setOperationAction(ISD::MEMBARRIER    , MVT::Other, Custom);
+  
    // On X86 and X86-64, atomic operations are lowered to locked instructions.
    // Locked instructions, in turn, have implicit fence semantics (all memory
    // operations are flushed before issuing the locked instruction, and they
@@ -7508,6 +7509,16 @@ SDValue X86TargetLowering::LowerXALUO(SDValue Op, SelectionDAG &DAG) const {
    return Sum;
  }
  
+SDValue X86TargetLowering::LowerMEMBARRIER(SDValue Op, SelectionDAG &DAG) const{
+  DebugLoc dl = Op.getDebugLoc();
+  // Lower to X86ISD::MEMBARRIER; without SSE2 also pass an i32 0 operand.
+  if (!Subtarget->hasSSE2())
+    return DAG.getNode(X86ISD::MEMBARRIER, dl, MVT::Other, Op.getOperand(0),
+                       DAG.getConstant(0, MVT::i32));
+  // With SSE2 only operand 0 is forwarded (the operand-less TD pattern).
+  return DAG.getNode(X86ISD::MEMBARRIER, dl, MVT::Other, Op.getOperand(0));
+}
+
  SDValue X86TargetLowering::LowerCMP_SWAP(SDValue Op, SelectionDAG &DAG) const {
    EVT T = Op.getValueType();
    DebugLoc dl = Op.getDebugLoc();
@@ -7597,6 +7608,7 @@ SDValue X86TargetLowering::LowerLOAD_SUB(SDValue Op, SelectionDAG &DAG) const {
  SDValue X86TargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG) const {
    switch (Op.getOpcode()) {
    default: llvm_unreachable("Should not custom lower this!");
+  case ISD::MEMBARRIER:         return LowerMEMBARRIER(Op,DAG);
    case ISD::ATOMIC_CMP_SWAP:    return LowerCMP_SWAP(Op,DAG);
    case ISD::ATOMIC_LOAD_SUB:    return LowerLOAD_SUB(Op,DAG);
    case ISD::BUILD_VECTOR:       return LowerBUILD_VECTOR(Op, DAG);
diff --git a/lib/Target/X86/X86ISelLowering.h b/lib/Target/X86/X86ISelLowering.h

index 4e4daa4bc5ca9def3eb3b6907ffa221d1a205a4c..221fff2fd44918af11b8c65193456f7aa051d3f2 100644 (file)
--- a/lib/Target/X86/X86ISelLowering.h
+++ b/lib/Target/X86/X86ISelLowering.h
@@ -265,7 +265,10 @@ namespace llvm {
        ATOMXOR64_DAG,
        ATOMAND64_DAG,
        ATOMNAND64_DAG,
-      ATOMSWAP64_DAG
+      ATOMSWAP64_DAG,
+      
+      // Memory barrier. NOTE(review): has memop per warning below - intended?
+      MEMBARRIER
  
        // WARNING: Do not add anything in the end unless you want the node to
        // have memop! In fact, starting from ATOMADD64_DAG all opcodes will be
@@ -715,6 +718,7 @@ namespace llvm {
      SDValue LowerCMP_SWAP(SDValue Op, SelectionDAG &DAG) const;
      SDValue LowerLOAD_SUB(SDValue Op, SelectionDAG &DAG) const;
      SDValue LowerREADCYCLECOUNTER(SDValue Op, SelectionDAG &DAG) const;
+    SDValue LowerMEMBARRIER(SDValue Op, SelectionDAG &DAG) const;
  
      virtual SDValue
        LowerFormalArguments(SDValue Chain,
diff --git a/lib/Target/X86/X86InstrInfo.td b/lib/Target/X86/X86InstrInfo.td

index 6917a9db6480f5497a59db3722f154d43de5f0df..d40ba69ddc21d63fd5df12a8a5a71d90c9adacf6 100644 (file)
--- a/lib/Target/X86/X86InstrInfo.td
+++ b/lib/Target/X86/X86InstrInfo.td
@@ -80,6 +80,14 @@ def SDT_X86EHRET : SDTypeProfile<0, 1, [SDTCisInt<0>]>;
  
  def SDT_X86TCRET : SDTypeProfile<0, 2, [SDTCisPtrTy<0>, SDTCisVT<1, i32>]>;
  
+def SDT_X86MEMBARRIER : SDTypeProfile<0, 0, []>;
+def SDT_X86MEMBARRIERNoSSE : SDTypeProfile<0, 1, [SDTCisInt<0>]>;
+// Two views of X86ISD::MEMBARRIER: without, and with, one integer operand.
+def X86MemBarrier : SDNode<"X86ISD::MEMBARRIER", SDT_X86MEMBARRIER,
+                            [SDNPHasChain]>;
+def X86MemBarrierNoSSE : SDNode<"X86ISD::MEMBARRIER", SDT_X86MEMBARRIERNoSSE,
+                                [SDNPHasChain]>;
+
  def X86bsf     : SDNode<"X86ISD::BSF",      SDTUnaryArithWithFlags>;
  def X86bsr     : SDNode<"X86ISD::BSR",      SDTUnaryArithWithFlags>;
  def X86shld    : SDNode<"X86ISD::SHLD",     SDTIntShiftDOp>;
@@ -3906,6 +3914,19 @@ def EH_RETURN   : I<0xC3, RawFrm, (outs), (ins GR32:$addr),
  // Atomic support
  //
  
+// Memory barriers
+let hasSideEffects = 1 in {
+def Int_MemBarrier : I<0, Pseudo, (outs), (ins),
+                     "#MEMBARRIER",
+                     [(X86MemBarrier)]>, Requires<[HasSSE2]>;
+// No-SSE2 form: a locked OR of $zero into (%esp) acts as the barrier.
+let Uses = [ESP], isCodeGenOnly = 1 in  // NOTE(review): no Defs = [EFLAGS]?
+def Int_MemBarrierNoSSE  : I<0x0B, Pseudo, (outs), (ins GR32:$zero),
+                           "lock\n\t"
+                           "or{l}\t{$zero, (%esp)|(%esp), $zero}",
+                           [(X86MemBarrierNoSSE GR32:$zero)]>, LOCK;
+}
+
  // Atomic swap. These are just normal xchg instructions. But since a memory
  // operand is referenced, the atomicity is ensured.
  let Constraints = "$val = $dst" in {
author	Eric Christopher <echristo@apple.com>
	Wed, 21 Jul 2010 09:05:23 +0000 (09:05 +0000)
committer	Eric Christopher <echristo@apple.com>
	Wed, 21 Jul 2010 09:05:23 +0000 (09:05 +0000)
lib/Target/X86/X86ISelLowering.cpp		patch \| blob \| history
lib/Target/X86/X86ISelLowering.h		patch \| blob \| history
lib/Target/X86/X86InstrInfo.td		patch \| blob \| history