lib/Target/X86/X86ISelDAGToDAG.cpp

   1 //===- X86ISelDAGToDAG.cpp - A DAG pattern matching inst selector for X86 -===//
   2 //
   3 //                     The LLVM Compiler Infrastructure
   4 //
   5 // This file was developed by the Evan Cheng and is distributed under
   6 // the University of Illinois Open Source License. See LICENSE.TXT for details.
   7 //
   8 //===----------------------------------------------------------------------===//
   9 //
  10 // This file defines a DAG pattern matching instruction selector for X86,
  11 // converting from a legalized dag to a X86 dag.
  12 //
  13 //===----------------------------------------------------------------------===//
  14
  15 #define DEBUG_TYPE "x86-isel"
  16 #include "X86.h"
  17 #include "X86InstrBuilder.h"
  18 #include "X86ISelLowering.h"
  19 #include "X86RegisterInfo.h"
  20 #include "X86Subtarget.h"
  21 #include "X86TargetMachine.h"
  22 #include "llvm/GlobalValue.h"
  23 #include "llvm/Instructions.h"
  24 #include "llvm/Intrinsics.h"
  25 #include "llvm/Support/CFG.h"
  26 #include "llvm/CodeGen/MachineConstantPool.h"
  27 #include "llvm/CodeGen/MachineFunction.h"
  28 #include "llvm/CodeGen/MachineFrameInfo.h"
  29 #include "llvm/CodeGen/MachineInstrBuilder.h"
  30 #include "llvm/CodeGen/SSARegMap.h"
  31 #include "llvm/CodeGen/SelectionDAGISel.h"
  32 #include "llvm/Target/TargetMachine.h"
  33 #include "llvm/Support/Compiler.h"
  34 #include "llvm/Support/Debug.h"
  35 #include "llvm/Support/MathExtras.h"
  36 #include "llvm/ADT/Statistic.h"
  37 #include <deque>
  38 #include <iostream>
  39 #include <queue>
  40 #include <set>
  41 using namespace llvm;
  42
  43 //===----------------------------------------------------------------------===//
  44 //                      Pattern Matcher Implementation
  45 //===----------------------------------------------------------------------===//
  46
  47 namespace {
  48   /// X86ISelAddressMode - This corresponds to X86AddressMode, but uses
  49   /// SDOperand's instead of register numbers for the leaves of the matched
  50   /// tree.
  51   struct X86ISelAddressMode {
  52     enum {
  53       RegBase,
  54       FrameIndexBase
  55     } BaseType;
  56
  57     struct {            // This is really a union, discriminated by BaseType!
  58       SDOperand Reg;
  59       int FrameIndex;
  60     } Base;
  61
  62     bool isRIPRel;     // RIP relative?
  63     unsigned Scale;
  64     SDOperand IndexReg;
  65     unsigned Disp;
  66     GlobalValue *GV;
  67     Constant *CP;
  68     const char *ES;
  69     int JT;
  70     unsigned Align;    // CP alignment.
  71
  72     X86ISelAddressMode()
  73       : BaseType(RegBase), isRIPRel(false), Scale(1), IndexReg(), Disp(0),
  74         GV(0), CP(0), ES(0), JT(-1), Align(0) {
  75     }
  76   };
  77 }
  78
  79 namespace {
  80   Statistic<>
  81   NumFPKill("x86-codegen", "Number of FP_REG_KILL instructions added");
  82
  83   Statistic<>
  84   NumLoadMoved("x86-codegen", "Number of loads moved below TokenFactor");
  85
  86   //===--------------------------------------------------------------------===//
  87   /// ISel - X86 specific code to select X86 machine instructions for
  88   /// SelectionDAG operations.
  89   ///
  90   class VISIBILITY_HIDDEN X86DAGToDAGISel : public SelectionDAGISel {
  91     /// ContainsFPCode - Every instruction we select that uses or defines a FP
  92     /// register should set this to true.
  93     bool ContainsFPCode;
  94
  95     /// FastISel - Enable fast(er) instruction selection.
  96     ///
  97     bool FastISel;
  98
  99     /// TM - Keep a reference to X86TargetMachine.
 100     ///
 101     X86TargetMachine &TM;
 102
 103     /// X86Lowering - This object fully describes how to lower LLVM code to an
 104     /// X86-specific SelectionDAG.
 105     X86TargetLowering X86Lowering;
 106
 107     /// Subtarget - Keep a pointer to the X86Subtarget around so that we can
 108     /// make the right decision when generating code for different targets.
 109     const X86Subtarget *Subtarget;
 110
 111     /// GlobalBaseReg - keeps track of the virtual register mapped onto global
 112     /// base register.
 113     unsigned GlobalBaseReg;
 114
 115   public:
 116     X86DAGToDAGISel(X86TargetMachine &tm, bool fast)
 117       : SelectionDAGISel(X86Lowering),
 118         ContainsFPCode(false), FastISel(fast), TM(tm),
 119         X86Lowering(*TM.getTargetLowering()),
 120         Subtarget(&TM.getSubtarget<X86Subtarget>()) {}
 121
 122     virtual bool runOnFunction(Function &Fn) {
 123       // Make sure we re-emit a set of the global base reg if necessary
 124       GlobalBaseReg = 0;
 125       return SelectionDAGISel::runOnFunction(Fn);
 126     }
 127
 128     virtual const char *getPassName() const {
 129       return "X86 DAG->DAG Instruction Selection";
 130     }
 131
 132     /// InstructionSelectBasicBlock - This callback is invoked by
 133     /// SelectionDAGISel when it has created a SelectionDAG for us to codegen.
 134     virtual void InstructionSelectBasicBlock(SelectionDAG &DAG);
 135
 136     virtual void EmitFunctionEntryCode(Function &Fn, MachineFunction &MF);
 137
 138     virtual bool CanBeFoldedBy(SDNode *N, SDNode *U);
 139
 140 // Include the pieces autogenerated from the target description.
 141 #include "X86GenDAGISel.inc"
 142
 143   private:
 144     SDNode *Select(SDOperand N);
 145
 146     bool MatchAddress(SDOperand N, X86ISelAddressMode &AM, bool isRoot = true);
 147     bool SelectAddr(SDOperand N, SDOperand &Base, SDOperand &Scale,
 148                     SDOperand &Index, SDOperand &Disp);
 149     bool SelectLEAAddr(SDOperand N, SDOperand &Base, SDOperand &Scale,
 150                        SDOperand &Index, SDOperand &Disp);
 151     bool TryFoldLoad(SDOperand P, SDOperand N,
 152                      SDOperand &Base, SDOperand &Scale,
 153                      SDOperand &Index, SDOperand &Disp);
 154     void InstructionSelectPreprocess(SelectionDAG &DAG);
 155
 156     /// SelectInlineAsmMemoryOperand - Implement addressing mode selection for
 157     /// inline asm expressions.
 158     virtual bool SelectInlineAsmMemoryOperand(const SDOperand &Op,
 159                                               char ConstraintCode,
 160                                               std::vector<SDOperand> &OutOps,
 161                                               SelectionDAG &DAG);
 162
 163     void EmitSpecialCodeForMain(MachineBasicBlock *BB, MachineFrameInfo *MFI);
 164
 165     inline void getAddressOperands(X86ISelAddressMode &AM, SDOperand &Base,
 166                                    SDOperand &Scale, SDOperand &Index,
 167                                    SDOperand &Disp) {
 168       Base  = (AM.BaseType == X86ISelAddressMode::FrameIndexBase) ?
 169         CurDAG->getTargetFrameIndex(AM.Base.FrameIndex, TLI.getPointerTy()) :
 170         AM.Base.Reg;
 171       Scale = getI8Imm(AM.Scale);
 172       Index = AM.IndexReg;
 173       // These are 32-bit even in 64-bit mode since RIP relative offset
 174       // is 32-bit.
 175       if (AM.GV)
 176         Disp = CurDAG->getTargetGlobalAddress(AM.GV, MVT::i32, AM.Disp);
 177       else if (AM.CP)
 178         Disp = CurDAG->getTargetConstantPool(AM.CP, MVT::i32, AM.Align, AM.Disp);
 179       else if (AM.ES)
 180         Disp = CurDAG->getTargetExternalSymbol(AM.ES, MVT::i32);
 181       else if (AM.JT != -1)
 182         Disp = CurDAG->getTargetJumpTable(AM.JT, MVT::i32);
 183       else
 184         Disp = getI32Imm(AM.Disp);
 185     }
 186
 187     /// getI8Imm - Return a target constant with the specified value, of type
 188     /// i8.
 189     inline SDOperand getI8Imm(unsigned Imm) {
 190       return CurDAG->getTargetConstant(Imm, MVT::i8);
 191     }
 192
 193     /// getI16Imm - Return a target constant with the specified value, of type
 194     /// i16.
 195     inline SDOperand getI16Imm(unsigned Imm) {
 196       return CurDAG->getTargetConstant(Imm, MVT::i16);
 197     }
 198
 199     /// getI32Imm - Return a target constant with the specified value, of type
 200     /// i32.
 201     inline SDOperand getI32Imm(unsigned Imm) {
 202       return CurDAG->getTargetConstant(Imm, MVT::i32);
 203     }
 204
 205     /// getGlobalBaseReg - insert code into the entry mbb to materialize the PIC
 206     /// base register.  Return the virtual register that holds this value.
 207     SDNode *getGlobalBaseReg();
 208
 209 #ifndef NDEBUG
 210     unsigned Indent;
 211 #endif
 212   };
 213 }
 214
 215 static void findNonImmUse(SDNode* Use, SDNode* Def, bool &found,
 216                           std::set<SDNode *> &Visited) {
 217   if (found ||
 218       Use->getNodeId() > Def->getNodeId() ||
 219       !Visited.insert(Use).second)
 220     return;
 221
 222   for (unsigned i = 0, e = Use->getNumOperands(); i != e; ++i) {
 223     SDNode *N = Use->getOperand(i).Val;
 224     if (N != Def) {
 225       findNonImmUse(N, Def, found, Visited);
 226     } else {
 227       found = true;
 228       break;
 229     }
 230   }
 231 }
 232
 233 static inline bool isNonImmUse(SDNode* Use, SDNode* Def) {
 234   std::set<SDNode *> Visited;
 235   bool found = false;
 236   for (unsigned i = 0, e = Use->getNumOperands(); i != e; ++i) {
 237     SDNode *N = Use->getOperand(i).Val;
 238     if (N != Def) {
 239       findNonImmUse(N, Def, found, Visited);
 240       if (found) break;
 241     }
 242   }
 243   return found;
 244 }
 245
 246
 247 bool X86DAGToDAGISel::CanBeFoldedBy(SDNode *N, SDNode *U) {
 248   // If U use can somehow reach N through another path then U can't fold N or
 249   // it will create a cycle. e.g. In the following diagram, U can reach N
 250   // through X. If N is folded into into U, then X is both a predecessor and
 251   // a successor of U.
 252   //
 253   //         [ N ]
 254   //         ^  ^
 255   //         |  |
 256   //        /   \---
 257   //      /        [X]
 258   //      |         ^
 259   //     [U]--------|
 260   return !FastISel && !isNonImmUse(U, N);
 261 }
 262
 263 /// MoveBelowTokenFactor - Replace TokenFactor operand with load's chain operand
 264 /// and move load below the TokenFactor. Replace store's chain operand with
 265 /// load's chain result.
 266 static void MoveBelowTokenFactor(SelectionDAG &DAG, SDOperand Load,
 267                                  SDOperand Store, SDOperand TF) {
 268   std::vector<SDOperand> Ops;
 269   for (unsigned i = 0, e = TF.Val->getNumOperands(); i != e; ++i)
 270     if (Load.Val == TF.Val->getOperand(i).Val)
 271       Ops.push_back(Load.Val->getOperand(0));
 272     else
 273       Ops.push_back(TF.Val->getOperand(i));
 274   DAG.UpdateNodeOperands(TF, &Ops[0], Ops.size());
 275   DAG.UpdateNodeOperands(Load, TF, Load.getOperand(1), Load.getOperand(2));
 276   DAG.UpdateNodeOperands(Store, Load.getValue(1), Store.getOperand(1),
 277                          Store.getOperand(2), Store.getOperand(3));
 278 }
 279
 280 /// InstructionSelectPreprocess - Preprocess the DAG to allow the instruction
 281 /// selector to pick more load-modify-store instructions. This is a common
 282 /// case:
 283 ///
 284 ///     [Load chain]
 285 ///         ^
 286 ///         |
 287 ///       [Load]
 288 ///       ^    ^
 289 ///       |    |
 290 ///      /      \-
 291 ///     /         |
 292 /// [TokenFactor] [Op]
 293 ///     ^          ^
 294 ///     |          |
 295 ///      \        /
 296 ///       \      /
 297 ///       [Store]
 298 ///
 299 /// The fact the store's chain operand != load's chain will prevent the
 300 /// (store (op (load))) instruction from being selected. We can transform it to:
 301 ///
 302 ///     [Load chain]
 303 ///         ^
 304 ///         |
 305 ///    [TokenFactor]
 306 ///         ^
 307 ///         |
 308 ///       [Load]
 309 ///       ^    ^
 310 ///       |    |
 311 ///       |     \-
 312 ///       |       |
 313 ///       |     [Op]
 314 ///       |       ^
 315 ///       |       |
 316 ///       \      /
 317 ///        \    /
 318 ///       [Store]
 319 void X86DAGToDAGISel::InstructionSelectPreprocess(SelectionDAG &DAG) {
 320   for (SelectionDAG::allnodes_iterator I = DAG.allnodes_begin(),
 321          E = DAG.allnodes_end(); I != E; ++I) {
 322     if (I->getOpcode() != ISD::STORE)
 323       continue;
 324     SDOperand Chain = I->getOperand(0);
 325     if (Chain.Val->getOpcode() != ISD::TokenFactor)
 326       continue;
 327
 328     SDOperand N1 = I->getOperand(1);
 329     SDOperand N2 = I->getOperand(2);
 330     if (MVT::isFloatingPoint(N1.getValueType()) ||
 331         MVT::isVector(N1.getValueType()) ||
 332         !N1.hasOneUse())
 333       continue;
 334
 335     bool RModW = false;
 336     SDOperand Load;
 337     unsigned Opcode = N1.Val->getOpcode();
 338     switch (Opcode) {
 339       case ISD::ADD:
 340       case ISD::MUL:
 341       case ISD::AND:
 342       case ISD::OR:
 343       case ISD::XOR:
 344       case ISD::ADDC:
 345       case ISD::ADDE: {
 346         SDOperand N10 = N1.getOperand(0);
 347         SDOperand N11 = N1.getOperand(1);
 348         if (N10.Val->getOpcode() == ISD::LOAD)
 349           RModW = true;
 350         else if (N11.Val->getOpcode() == ISD::LOAD) {
 351           RModW = true;
 352           std::swap(N10, N11);
 353         }
 354         RModW = RModW && N10.Val->isOperand(Chain.Val) && N10.hasOneUse() &&
 355           (N10.getOperand(1) == N2) &&
 356           (N10.Val->getValueType(0) == N1.getValueType());
 357         if (RModW)
 358           Load = N10;
 359         break;
 360       }
 361       case ISD::SUB:
 362       case ISD::SHL:
 363       case ISD::SRA:
 364       case ISD::SRL:
 365       case ISD::ROTL:
 366       case ISD::ROTR:
 367       case ISD::SUBC:
 368       case ISD::SUBE:
 369       case X86ISD::SHLD:
 370       case X86ISD::SHRD: {
 371         SDOperand N10 = N1.getOperand(0);
 372         if (N10.Val->getOpcode() == ISD::LOAD)
 373           RModW = N10.Val->isOperand(Chain.Val) && N10.hasOneUse() &&
 374             (N10.getOperand(1) == N2) &&
 375             (N10.Val->getValueType(0) == N1.getValueType());
 376         if (RModW)
 377           Load = N10;
 378         break;
 379       }
 380     }
 381
 382     if (RModW) {
 383       MoveBelowTokenFactor(DAG, Load, SDOperand(I, 0), Chain);
 384       ++NumLoadMoved;
 385     }
 386   }
 387 }
 388
 389 /// InstructionSelectBasicBlock - This callback is invoked by SelectionDAGISel
 390 /// when it has created a SelectionDAG for us to codegen.
 391 void X86DAGToDAGISel::InstructionSelectBasicBlock(SelectionDAG &DAG) {
 392   DEBUG(BB->dump());
 393   MachineFunction::iterator FirstMBB = BB;
 394
 395   if (!FastISel)
 396     InstructionSelectPreprocess(DAG);
 397
 398   // Codegen the basic block.
 399 #ifndef NDEBUG
 400   DEBUG(std::cerr << "===== Instruction selection begins:\n");
 401   Indent = 0;
 402 #endif
 403   DAG.setRoot(SelectRoot(DAG.getRoot()));
 404 #ifndef NDEBUG
 405   DEBUG(std::cerr << "===== Instruction selection ends:\n");
 406 #endif
 407
 408   DAG.RemoveDeadNodes();
 409
 410   // Emit machine code to BB.
 411   ScheduleAndEmitDAG(DAG);
 412
 413   // If we are emitting FP stack code, scan the basic block to determine if this
 414   // block defines any FP values.  If so, put an FP_REG_KILL instruction before
 415   // the terminator of the block.
 416   if (!Subtarget->hasSSE2()) {
 417     // Note that FP stack instructions *are* used in SSE code when returning
 418     // values, but these are not live out of the basic block, so we don't need
 419     // an FP_REG_KILL in this case either.
 420     bool ContainsFPCode = false;
 421
 422     // Scan all of the machine instructions in these MBBs, checking for FP
 423     // stores.
 424     MachineFunction::iterator MBBI = FirstMBB;
 425     do {
 426       for (MachineBasicBlock::iterator I = MBBI->begin(), E = MBBI->end();
 427            !ContainsFPCode && I != E; ++I) {
 428         for (unsigned op = 0, e = I->getNumOperands(); op != e; ++op) {
 429           if (I->getOperand(op).isRegister() && I->getOperand(op).isDef() &&
 430               MRegisterInfo::isVirtualRegister(I->getOperand(op).getReg()) &&
 431               RegMap->getRegClass(I->getOperand(0).getReg()) ==
 432                 X86::RFPRegisterClass) {
 433             ContainsFPCode = true;
 434             break;
 435           }
 436         }
 437       }
 438     } while (!ContainsFPCode && &*(MBBI++) != BB);
 439
 440     // Check PHI nodes in successor blocks.  These PHI's will be lowered to have
 441     // a copy of the input value in this block.
 442     if (!ContainsFPCode) {
 443       // Final check, check LLVM BB's that are successors to the LLVM BB
 444       // corresponding to BB for FP PHI nodes.
 445       const BasicBlock *LLVMBB = BB->getBasicBlock();
 446       const PHINode *PN;
 447       for (succ_const_iterator SI = succ_begin(LLVMBB), E = succ_end(LLVMBB);
 448            !ContainsFPCode && SI != E; ++SI) {
 449         for (BasicBlock::const_iterator II = SI->begin();
 450              (PN = dyn_cast<PHINode>(II)); ++II) {
 451           if (PN->getType()->isFloatingPoint()) {
 452             ContainsFPCode = true;
 453             break;
 454           }
 455         }
 456       }
 457     }
 458
 459     // Finally, if we found any FP code, emit the FP_REG_KILL instruction.
 460     if (ContainsFPCode) {
 461       BuildMI(*BB, BB->getFirstTerminator(), X86::FP_REG_KILL, 0);
 462       ++NumFPKill;
 463     }
 464   }
 465 }
 466
 467 /// EmitSpecialCodeForMain - Emit any code that needs to be executed only in
 468 /// the main function.
 469 void X86DAGToDAGISel::EmitSpecialCodeForMain(MachineBasicBlock *BB,
 470                                              MachineFrameInfo *MFI) {
 471   if (Subtarget->TargetType == X86Subtarget::isCygwin)
 472     BuildMI(BB, X86::CALLpcrel32, 1).addExternalSymbol("__main");
 473
 474   // Switch the FPU to 64-bit precision mode for better compatibility and speed.
 475   int CWFrameIdx = MFI->CreateStackObject(2, 2);
 476   addFrameReference(BuildMI(BB, X86::FNSTCW16m, 4), CWFrameIdx);
 477
 478   // Set the high part to be 64-bit precision.
 479   addFrameReference(BuildMI(BB, X86::MOV8mi, 5),
 480                     CWFrameIdx, 1).addImm(2);
 481
 482   // Reload the modified control word now.
 483   addFrameReference(BuildMI(BB, X86::FLDCW16m, 4), CWFrameIdx);
 484 }
 485
 486 void X86DAGToDAGISel::EmitFunctionEntryCode(Function &Fn, MachineFunction &MF) {
 487   // If this is main, emit special code for main.
 488   MachineBasicBlock *BB = MF.begin();
 489   if (Fn.hasExternalLinkage() && Fn.getName() == "main")
 490     EmitSpecialCodeForMain(BB, MF.getFrameInfo());
 491 }
 492
 493 /// MatchAddress - Add the specified node to the specified addressing mode,
 494 /// returning true if it cannot be done.  This just pattern matches for the
 495 /// addressing mode
 496 bool X86DAGToDAGISel::MatchAddress(SDOperand N, X86ISelAddressMode &AM,
 497                                    bool isRoot) {
 498   // RIP relative addressing: %rip + 32-bit displacement!
 499   if (AM.isRIPRel) {
 500     if (!AM.ES && AM.JT != -1 && N.getOpcode() == ISD::Constant) {
 501       int64_t Val = cast<ConstantSDNode>(N)->getSignExtended();
 502       if (isInt32(AM.Disp + Val)) {
 503         AM.Disp += Val;
 504         return false;
 505       }
 506     }
 507     return true;
 508   }
 509
 510   int id = N.Val->getNodeId();
 511   bool Available = isSelected(id);
 512
 513   switch (N.getOpcode()) {
 514   default: break;
 515   case ISD::Constant: {
 516     int64_t Val = cast<ConstantSDNode>(N)->getSignExtended();
 517     if (isInt32(AM.Disp + Val)) {
 518       AM.Disp += Val;
 519       return false;
 520     }
 521     break;
 522   }
 523
 524   case X86ISD::Wrapper:
 525     // If value is available in a register both base and index components have
 526     // been picked, we can't fit the result available in the register in the
 527     // addressing mode. Duplicate GlobalAddress or ConstantPool as displacement.
 528
 529     // Can't fit GV or CP in addressing mode for X86-64 medium or large code
 530     // model since the displacement field is 32-bit. Ok for small code model.
 531
 532     // For X86-64 PIC code, only allow GV / CP + displacement so we can use RIP
 533     // relative addressing mode.
 534     if ((!Subtarget->is64Bit() || TM.getCodeModel() == CodeModel::Small) &&
 535         (!Available || (AM.Base.Reg.Val && AM.IndexReg.Val))) {
 536       bool isRIP = Subtarget->is64Bit();
 537       if (isRIP && (AM.Base.Reg.Val || AM.Scale > 1 || AM.IndexReg.Val ||
 538                     AM.BaseType == X86ISelAddressMode::FrameIndexBase))
 539         break;
 540       if (ConstantPoolSDNode *CP =
 541           dyn_cast<ConstantPoolSDNode>(N.getOperand(0))) {
 542         if (AM.CP == 0) {
 543           AM.CP = CP->getConstVal();
 544           AM.Align = CP->getAlignment();
 545           AM.Disp += CP->getOffset();
 546           if (isRIP)
 547             AM.isRIPRel = true;
 548           return false;
 549         }
 550       } else if (GlobalAddressSDNode *G =
 551                  dyn_cast<GlobalAddressSDNode>(N.getOperand(0))) {
 552         if (AM.GV == 0) {
 553           AM.GV = G->getGlobal();
 554           AM.Disp += G->getOffset();
 555           if (isRIP)
 556             AM.isRIPRel = true;
 557           return false;
 558         }
 559       } else if (isRoot && isRIP) {
 560         if (ExternalSymbolSDNode *S =
 561             dyn_cast<ExternalSymbolSDNode>(N.getOperand(0))) {
 562           AM.ES = S->getSymbol();
 563           AM.isRIPRel = true;
 564           return false;
 565         } else if (JumpTableSDNode *J =
 566                    dyn_cast<JumpTableSDNode>(N.getOperand(0))) {
 567           AM.JT = J->getIndex();
 568           AM.isRIPRel = true;
 569           return false;
 570         }
 571       }
 572     }
 573     break;
 574
 575   case ISD::FrameIndex:
 576     if (AM.BaseType == X86ISelAddressMode::RegBase && AM.Base.Reg.Val == 0) {
 577       AM.BaseType = X86ISelAddressMode::FrameIndexBase;
 578       AM.Base.FrameIndex = cast<FrameIndexSDNode>(N)->getIndex();
 579       return false;
 580     }
 581     break;
 582
 583   case ISD::SHL:
 584     if (!Available && AM.IndexReg.Val == 0 && AM.Scale == 1)
 585       if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N.Val->getOperand(1))) {
 586         unsigned Val = CN->getValue();
 587         if (Val == 1 || Val == 2 || Val == 3) {
 588           AM.Scale = 1 << Val;
 589           SDOperand ShVal = N.Val->getOperand(0);
 590
 591           // Okay, we know that we have a scale by now.  However, if the scaled
 592           // value is an add of something and a constant, we can fold the
 593           // constant into the disp field here.
 594           if (ShVal.Val->getOpcode() == ISD::ADD && ShVal.hasOneUse() &&
 595               isa<ConstantSDNode>(ShVal.Val->getOperand(1))) {
 596             AM.IndexReg = ShVal.Val->getOperand(0);
 597             ConstantSDNode *AddVal =
 598               cast<ConstantSDNode>(ShVal.Val->getOperand(1));
 599             uint64_t Disp = AM.Disp + AddVal->getValue() << Val;
 600             if (isInt32(Disp))
 601               AM.Disp = Disp;
 602             else
 603               AM.IndexReg = ShVal;
 604           } else {
 605             AM.IndexReg = ShVal;
 606           }
 607           return false;
 608         }
 609       }
 610     break;
 611
 612   case ISD::MUL:
 613     // X*[3,5,9] -> X+X*[2,4,8]
 614     if (!Available &&
 615         AM.BaseType == X86ISelAddressMode::RegBase &&
 616         AM.Base.Reg.Val == 0 &&
 617         AM.IndexReg.Val == 0)
 618       if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N.Val->getOperand(1)))
 619         if (CN->getValue() == 3 || CN->getValue() == 5 || CN->getValue() == 9) {
 620           AM.Scale = unsigned(CN->getValue())-1;
 621
 622           SDOperand MulVal = N.Val->getOperand(0);
 623           SDOperand Reg;
 624
 625           // Okay, we know that we have a scale by now.  However, if the scaled
 626           // value is an add of something and a constant, we can fold the
 627           // constant into the disp field here.
 628           if (MulVal.Val->getOpcode() == ISD::ADD && MulVal.hasOneUse() &&
 629               isa<ConstantSDNode>(MulVal.Val->getOperand(1))) {
 630             Reg = MulVal.Val->getOperand(0);
 631             ConstantSDNode *AddVal =
 632               cast<ConstantSDNode>(MulVal.Val->getOperand(1));
 633             uint64_t Disp = AM.Disp + AddVal->getValue() * CN->getValue();
 634             if (isInt32(Disp))
 635               AM.Disp = Disp;
 636             else
 637               Reg = N.Val->getOperand(0);
 638           } else {
 639             Reg = N.Val->getOperand(0);
 640           }
 641
 642           AM.IndexReg = AM.Base.Reg = Reg;
 643           return false;
 644         }
 645     break;
 646
 647   case ISD::ADD: {
 648     if (!Available) {
 649       X86ISelAddressMode Backup = AM;
 650       if (!MatchAddress(N.Val->getOperand(0), AM, false) &&
 651           !MatchAddress(N.Val->getOperand(1), AM, false))
 652         return false;
 653       AM = Backup;
 654       if (!MatchAddress(N.Val->getOperand(1), AM, false) &&
 655           !MatchAddress(N.Val->getOperand(0), AM, false))
 656         return false;
 657       AM = Backup;
 658     }
 659     break;
 660   }
 661
 662   case ISD::OR: {
 663     if (!Available) {
 664       X86ISelAddressMode Backup = AM;
 665       // Look for (x << c1) | c2 where (c2 < c1)
 666       ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N.Val->getOperand(0));
 667       if (CN && !MatchAddress(N.Val->getOperand(1), AM, false)) {
 668         if (AM.GV == NULL && AM.Disp == 0 && CN->getValue() < AM.Scale) {
 669           AM.Disp = CN->getValue();
 670           return false;
 671         }
 672       }
 673       AM = Backup;
 674       CN = dyn_cast<ConstantSDNode>(N.Val->getOperand(1));
 675       if (CN && !MatchAddress(N.Val->getOperand(0), AM, false)) {
 676         if (AM.GV == NULL && AM.Disp == 0 && CN->getValue() < AM.Scale) {
 677           AM.Disp = CN->getValue();
 678           return false;
 679         }
 680       }
 681       AM = Backup;
 682     }
 683     break;
 684   }
 685   }
 686
 687   // Is the base register already occupied?
 688   if (AM.BaseType != X86ISelAddressMode::RegBase || AM.Base.Reg.Val) {
 689     // If so, check to see if the scale index register is set.
 690     if (AM.IndexReg.Val == 0) {
 691       AM.IndexReg = N;
 692       AM.Scale = 1;
 693       return false;
 694     }
 695
 696     // Otherwise, we cannot select it.
 697     return true;
 698   }
 699
 700   // Default, generate it as a register.
 701   AM.BaseType = X86ISelAddressMode::RegBase;
 702   AM.Base.Reg = N;
 703   return false;
 704 }
 705
 706 /// SelectAddr - returns true if it is able pattern match an addressing mode.
 707 /// It returns the operands which make up the maximal addressing mode it can
 708 /// match by reference.
 709 bool X86DAGToDAGISel::SelectAddr(SDOperand N, SDOperand &Base, SDOperand &Scale,
 710                                  SDOperand &Index, SDOperand &Disp) {
 711   X86ISelAddressMode AM;
 712   if (MatchAddress(N, AM))
 713     return false;
 714
 715   MVT::ValueType VT = N.getValueType();
 716   if (AM.BaseType == X86ISelAddressMode::RegBase) {
 717     if (!AM.Base.Reg.Val)
 718       AM.Base.Reg = CurDAG->getRegister(0, VT);
 719   }
 720
 721   if (!AM.IndexReg.Val)
 722     AM.IndexReg = CurDAG->getRegister(0, VT);
 723
 724   getAddressOperands(AM, Base, Scale, Index, Disp);
 725   return true;
 726 }
 727
 728 /// SelectLEAAddr - it calls SelectAddr and determines if the maximal addressing
 729 /// mode it matches can be cost effectively emitted as an LEA instruction.
 730 bool X86DAGToDAGISel::SelectLEAAddr(SDOperand N, SDOperand &Base,
 731                                     SDOperand &Scale,
 732                                     SDOperand &Index, SDOperand &Disp) {
 733   X86ISelAddressMode AM;
 734   if (MatchAddress(N, AM))
 735     return false;
 736
 737   MVT::ValueType VT = N.getValueType();
 738   unsigned Complexity = 0;
 739   if (AM.BaseType == X86ISelAddressMode::RegBase)
 740     if (AM.Base.Reg.Val)
 741       Complexity = 1;
 742     else
 743       AM.Base.Reg = CurDAG->getRegister(0, VT);
 744   else if (AM.BaseType == X86ISelAddressMode::FrameIndexBase)
 745     Complexity = 4;
 746
 747   if (AM.IndexReg.Val)
 748     Complexity++;
 749   else
 750     AM.IndexReg = CurDAG->getRegister(0, VT);
 751
 752   if (AM.Scale > 2)
 753     Complexity += 2;
 754   // Don't match just leal(,%reg,2). It's cheaper to do addl %reg, %reg
 755   else if (AM.Scale > 1)
 756     Complexity++;
 757
 758   // FIXME: We are artificially lowering the criteria to turn ADD %reg, $GA
 759   // to a LEA. This is determined with some expermentation but is by no means
 760   // optimal (especially for code size consideration). LEA is nice because of
 761   // its three-address nature. Tweak the cost function again when we can run
 762   // convertToThreeAddress() at register allocation time.
 763   if (AM.GV || AM.CP || AM.ES || AM.JT != -1) {
 764     // For X86-64, we should always use lea to materialize RIP relative
 765     // addresses.
 766     if (Subtarget->is64Bit())
 767       Complexity = 4;
 768     else
 769       Complexity += 2;
 770   }
 771
 772   if (AM.Disp && (AM.Base.Reg.Val || AM.IndexReg.Val))
 773     Complexity++;
 774
 775   if (Complexity > 2) {
 776     getAddressOperands(AM, Base, Scale, Index, Disp);
 777     return true;
 778   }
 779   return false;
 780 }
 781
 782 bool X86DAGToDAGISel::TryFoldLoad(SDOperand P, SDOperand N,
 783                                   SDOperand &Base, SDOperand &Scale,
 784                                   SDOperand &Index, SDOperand &Disp) {
 785   if (N.getOpcode() == ISD::LOAD &&
 786       N.hasOneUse() &&
 787       P.Val->isOnlyUse(N.Val) &&
 788       CanBeFoldedBy(N.Val, P.Val))
 789     return SelectAddr(N.getOperand(1), Base, Scale, Index, Disp);
 790   return false;
 791 }
 792
 793 static bool isRegister0(SDOperand Op) {
 794   if (RegisterSDNode *R = dyn_cast<RegisterSDNode>(Op))
 795     return (R->getReg() == 0);
 796   return false;
 797 }
 798
 799 /// getGlobalBaseReg - Output the instructions required to put the
 800 /// base address to use for accessing globals into a register.
 801 ///
 802 SDNode *X86DAGToDAGISel::getGlobalBaseReg() {
 803   assert(!Subtarget->is64Bit() && "X86-64 PIC uses RIP relative addressing");
 804   if (!GlobalBaseReg) {
 805     // Insert the set of GlobalBaseReg into the first MBB of the function
 806     MachineBasicBlock &FirstMBB = BB->getParent()->front();
 807     MachineBasicBlock::iterator MBBI = FirstMBB.begin();
 808     SSARegMap *RegMap = BB->getParent()->getSSARegMap();
 809     // FIXME: when we get to LP64, we will need to create the appropriate
 810     // type of register here.
 811     GlobalBaseReg = RegMap->createVirtualRegister(X86::GR32RegisterClass);
 812     BuildMI(FirstMBB, MBBI, X86::MovePCtoStack, 0);
 813     BuildMI(FirstMBB, MBBI, X86::POP32r, 1, GlobalBaseReg);
 814   }
 815   return CurDAG->getRegister(GlobalBaseReg, TLI.getPointerTy()).Val;
 816 }
 817
 818 static SDNode *FindCallStartFromCall(SDNode *Node) {
 819   if (Node->getOpcode() == ISD::CALLSEQ_START) return Node;
 820     assert(Node->getOperand(0).getValueType() == MVT::Other &&
 821          "Node doesn't have a token chain argument!");
 822   return FindCallStartFromCall(Node->getOperand(0).Val);
 823 }
 824
 825 SDNode *X86DAGToDAGISel::Select(SDOperand N) {
 826   SDNode *Node = N.Val;
 827   MVT::ValueType NVT = Node->getValueType(0);
 828   unsigned Opc, MOpc;
 829   unsigned Opcode = Node->getOpcode();
 830
 831 #ifndef NDEBUG
 832   DEBUG(std::cerr << std::string(Indent, ' '));
 833   DEBUG(std::cerr << "Selecting: ");
 834   DEBUG(Node->dump(CurDAG));
 835   DEBUG(std::cerr << "\n");
 836   Indent += 2;
 837 #endif
 838
 839   if (Opcode >= ISD::BUILTIN_OP_END && Opcode < X86ISD::FIRST_NUMBER) {
 840 #ifndef NDEBUG
 841     DEBUG(std::cerr << std::string(Indent-2, ' '));
 842     DEBUG(std::cerr << "== ");
 843     DEBUG(Node->dump(CurDAG));
 844     DEBUG(std::cerr << "\n");
 845     Indent -= 2;
 846 #endif
 847     return NULL;   // Already selected.
 848   }
 849
 850   switch (Opcode) {
 851     default: break;
 852     case X86ISD::GlobalBaseReg:
 853       return getGlobalBaseReg();
 854
 855     case ISD::ADD: {
 856       // Turn ADD X, c to MOV32ri X+c. This cannot be done with tblgen'd
 857       // code and is matched first so to prevent it from being turned into
 858       // LEA32r X+c.
 859       // In 64-bit mode, use LEA to take advantage of RIP-relative addressing.
 860       MVT::ValueType PtrVT = TLI.getPointerTy();
 861       SDOperand N0 = N.getOperand(0);
 862       SDOperand N1 = N.getOperand(1);
 863       if (N.Val->getValueType(0) == PtrVT &&
 864           N0.getOpcode() == X86ISD::Wrapper &&
 865           N1.getOpcode() == ISD::Constant) {
 866         unsigned Offset = (unsigned)cast<ConstantSDNode>(N1)->getValue();
 867         SDOperand C(0, 0);
 868         // TODO: handle ExternalSymbolSDNode.
 869         if (GlobalAddressSDNode *G =
 870             dyn_cast<GlobalAddressSDNode>(N0.getOperand(0))) {
 871           C = CurDAG->getTargetGlobalAddress(G->getGlobal(), PtrVT,
 872                                              G->getOffset() + Offset);
 873         } else if (ConstantPoolSDNode *CP =
 874                    dyn_cast<ConstantPoolSDNode>(N0.getOperand(0))) {
 875           C = CurDAG->getTargetConstantPool(CP->getConstVal(), PtrVT,
 876                                             CP->getAlignment(),
 877                                             CP->getOffset()+Offset);
 878         }
 879
 880         if (C.Val) {
 881           if (Subtarget->is64Bit()) {
 882             SDOperand Ops[] = { CurDAG->getRegister(0, PtrVT), getI8Imm(1),
 883                                 CurDAG->getRegister(0, PtrVT), C };
 884             return CurDAG->SelectNodeTo(N.Val, X86::LEA64r, MVT::i64, Ops, 4);
 885           } else
 886             return CurDAG->SelectNodeTo(N.Val, X86::MOV32ri, PtrVT, C);
 887         }
 888       }
 889
 890       // Other cases are handled by auto-generated code.
 891       break;
 892     }
 893
 894     case ISD::MULHU:
 895     case ISD::MULHS: {
 896       if (Opcode == ISD::MULHU)
 897         switch (NVT) {
 898         default: assert(0 && "Unsupported VT!");
 899         case MVT::i8:  Opc = X86::MUL8r;  MOpc = X86::MUL8m;  break;
 900         case MVT::i16: Opc = X86::MUL16r; MOpc = X86::MUL16m; break;
 901         case MVT::i32: Opc = X86::MUL32r; MOpc = X86::MUL32m; break;
 902         case MVT::i64: Opc = X86::MUL64r; MOpc = X86::MUL64m; break;
 903         }
 904       else
 905         switch (NVT) {
 906         default: assert(0 && "Unsupported VT!");
 907         case MVT::i8:  Opc = X86::IMUL8r;  MOpc = X86::IMUL8m;  break;
 908         case MVT::i16: Opc = X86::IMUL16r; MOpc = X86::IMUL16m; break;
 909         case MVT::i32: Opc = X86::IMUL32r; MOpc = X86::IMUL32m; break;
 910         case MVT::i64: Opc = X86::IMUL64r; MOpc = X86::IMUL64m; break;
 911         }
 912
 913       unsigned LoReg, HiReg;
 914       switch (NVT) {
 915       default: assert(0 && "Unsupported VT!");
 916       case MVT::i8:  LoReg = X86::AL;  HiReg = X86::AH;  break;
 917       case MVT::i16: LoReg = X86::AX;  HiReg = X86::DX;  break;
 918       case MVT::i32: LoReg = X86::EAX; HiReg = X86::EDX; break;
 919       case MVT::i64: LoReg = X86::RAX; HiReg = X86::RDX; break;
 920       }
 921
 922       SDOperand N0 = Node->getOperand(0);
 923       SDOperand N1 = Node->getOperand(1);
 924
 925       bool foldedLoad = false;
 926       SDOperand Tmp0, Tmp1, Tmp2, Tmp3;
 927       foldedLoad = TryFoldLoad(N, N1, Tmp0, Tmp1, Tmp2, Tmp3);
 928       // MULHU and MULHS are commmutative
 929       if (!foldedLoad) {
 930         foldedLoad = TryFoldLoad(N, N0, Tmp0, Tmp1, Tmp2, Tmp3);
 931         if (foldedLoad) {
 932           N0 = Node->getOperand(1);
 933           N1 = Node->getOperand(0);
 934         }
 935       }
 936
 937       SDOperand Chain;
 938       if (foldedLoad) {
 939         Chain = N1.getOperand(0);
 940         AddToISelQueue(Chain);
 941       } else
 942         Chain = CurDAG->getEntryNode();
 943
 944       SDOperand InFlag(0, 0);
 945       AddToISelQueue(N0);
 946       Chain  = CurDAG->getCopyToReg(Chain, CurDAG->getRegister(LoReg, NVT),
 947                                     N0, InFlag);
 948       InFlag = Chain.getValue(1);
 949
 950       if (foldedLoad) {
 951         AddToISelQueue(Tmp0);
 952         AddToISelQueue(Tmp1);
 953         AddToISelQueue(Tmp2);
 954         AddToISelQueue(Tmp3);
 955         SDOperand Ops[] = { Tmp0, Tmp1, Tmp2, Tmp3, Chain, InFlag };
 956         SDNode *CNode =
 957           CurDAG->getTargetNode(MOpc, MVT::Other, MVT::Flag, Ops, 6);
 958         Chain  = SDOperand(CNode, 0);
 959         InFlag = SDOperand(CNode, 1);
 960       } else {
 961         AddToISelQueue(N1);
 962         InFlag =
 963           SDOperand(CurDAG->getTargetNode(Opc, MVT::Flag, N1, InFlag), 0);
 964       }
 965
 966       SDOperand Result = CurDAG->getCopyFromReg(Chain, HiReg, NVT, InFlag);
 967       ReplaceUses(N.getValue(0), Result);
 968       if (foldedLoad)
 969         ReplaceUses(N1.getValue(1), Result.getValue(1));
 970
 971 #ifndef NDEBUG
 972       DEBUG(std::cerr << std::string(Indent-2, ' '));
 973       DEBUG(std::cerr << "=> ");
 974       DEBUG(Result.Val->dump(CurDAG));
 975       DEBUG(std::cerr << "\n");
 976       Indent -= 2;
 977 #endif
 978       return NULL;
 979     }
 980
 981     case ISD::SDIV:
 982     case ISD::UDIV:
 983     case ISD::SREM:
 984     case ISD::UREM: {
 985       bool isSigned = Opcode == ISD::SDIV || Opcode == ISD::SREM;
 986       bool isDiv    = Opcode == ISD::SDIV || Opcode == ISD::UDIV;
 987       if (!isSigned)
 988         switch (NVT) {
 989         default: assert(0 && "Unsupported VT!");
 990         case MVT::i8:  Opc = X86::DIV8r;  MOpc = X86::DIV8m;  break;
 991         case MVT::i16: Opc = X86::DIV16r; MOpc = X86::DIV16m; break;
 992         case MVT::i32: Opc = X86::DIV32r; MOpc = X86::DIV32m; break;
 993         case MVT::i64: Opc = X86::DIV64r; MOpc = X86::DIV64m; break;
 994         }
 995       else
 996         switch (NVT) {
 997         default: assert(0 && "Unsupported VT!");
 998         case MVT::i8:  Opc = X86::IDIV8r;  MOpc = X86::IDIV8m;  break;
 999         case MVT::i16: Opc = X86::IDIV16r; MOpc = X86::IDIV16m; break;
1000         case MVT::i32: Opc = X86::IDIV32r; MOpc = X86::IDIV32m; break;
1001         case MVT::i64: Opc = X86::IDIV64r; MOpc = X86::IDIV64m; break;
1002         }
1003
1004       unsigned LoReg, HiReg;
1005       unsigned ClrOpcode, SExtOpcode;
1006       switch (NVT) {
1007       default: assert(0 && "Unsupported VT!");
1008       case MVT::i8:
1009         LoReg = X86::AL;  HiReg = X86::AH;
1010         ClrOpcode  = X86::MOV8r0;
1011         SExtOpcode = X86::CBW;
1012         break;
1013       case MVT::i16:
1014         LoReg = X86::AX;  HiReg = X86::DX;
1015         ClrOpcode  = X86::MOV16r0;
1016         SExtOpcode = X86::CWD;
1017         break;
1018       case MVT::i32:
1019         LoReg = X86::EAX; HiReg = X86::EDX;
1020         ClrOpcode  = X86::MOV32r0;
1021         SExtOpcode = X86::CDQ;
1022         break;
1023       case MVT::i64:
1024         LoReg = X86::RAX; HiReg = X86::RDX;
1025         ClrOpcode  = X86::MOV64r0;
1026         SExtOpcode = X86::CQO;
1027         break;
1028       }
1029
1030       SDOperand N0 = Node->getOperand(0);
1031       SDOperand N1 = Node->getOperand(1);
1032
1033       bool foldedLoad = false;
1034       SDOperand Tmp0, Tmp1, Tmp2, Tmp3;
1035       foldedLoad = TryFoldLoad(N, N1, Tmp0, Tmp1, Tmp2, Tmp3);
1036       SDOperand Chain;
1037       if (foldedLoad) {
1038         Chain = N1.getOperand(0);
1039         AddToISelQueue(Chain);
1040       } else
1041         Chain = CurDAG->getEntryNode();
1042
1043       SDOperand InFlag(0, 0);
1044       AddToISelQueue(N0);
1045       Chain  = CurDAG->getCopyToReg(Chain, CurDAG->getRegister(LoReg, NVT),
1046                                     N0, InFlag);
1047       InFlag = Chain.getValue(1);
1048
1049       if (isSigned) {
1050         // Sign extend the low part into the high part.
1051         InFlag =
1052           SDOperand(CurDAG->getTargetNode(SExtOpcode, MVT::Flag, InFlag), 0);
1053       } else {
1054         // Zero out the high part, effectively zero extending the input.
1055         SDOperand ClrNode = SDOperand(CurDAG->getTargetNode(ClrOpcode, NVT), 0);
1056         Chain  = CurDAG->getCopyToReg(Chain, CurDAG->getRegister(HiReg, NVT),
1057                                       ClrNode, InFlag);
1058         InFlag = Chain.getValue(1);
1059       }
1060
1061       if (foldedLoad) {
1062         AddToISelQueue(Tmp0);
1063         AddToISelQueue(Tmp1);
1064         AddToISelQueue(Tmp2);
1065         AddToISelQueue(Tmp3);
1066         SDOperand Ops[] = { Tmp0, Tmp1, Tmp2, Tmp3, Chain, InFlag };
1067         SDNode *CNode =
1068           CurDAG->getTargetNode(MOpc, MVT::Other, MVT::Flag, Ops, 6);
1069         Chain  = SDOperand(CNode, 0);
1070         InFlag = SDOperand(CNode, 1);
1071       } else {
1072         AddToISelQueue(N1);
1073         InFlag =
1074           SDOperand(CurDAG->getTargetNode(Opc, MVT::Flag, N1, InFlag), 0);
1075       }
1076
1077       SDOperand Result = CurDAG->getCopyFromReg(Chain, isDiv ? LoReg : HiReg,
1078                                                 NVT, InFlag);
1079       ReplaceUses(N.getValue(0), Result);
1080       if (foldedLoad)
1081         ReplaceUses(N1.getValue(1), Result.getValue(1));
1082
1083 #ifndef NDEBUG
1084       DEBUG(std::cerr << std::string(Indent-2, ' '));
1085       DEBUG(std::cerr << "=> ");
1086       DEBUG(Result.Val->dump(CurDAG));
1087       DEBUG(std::cerr << "\n");
1088       Indent -= 2;
1089 #endif
1090
1091       return NULL;
1092     }
1093
1094     case ISD::TRUNCATE: {
1095       if (!Subtarget->is64Bit() && NVT == MVT::i8) {
1096         unsigned Opc2;
1097         MVT::ValueType VT;
1098         switch (Node->getOperand(0).getValueType()) {
1099         default: assert(0 && "Unknown truncate!");
1100         case MVT::i16:
1101           Opc = X86::MOV16to16_;
1102           VT = MVT::i16;
1103           Opc2 = X86::TRUNC_16_to8;
1104           break;
1105         case MVT::i32:
1106           Opc = X86::MOV32to32_;
1107           VT = MVT::i32;
1108           Opc2 = X86::TRUNC_32_to8;
1109           break;
1110         }
1111
1112         AddToISelQueue(Node->getOperand(0));
1113         SDOperand Tmp =
1114           SDOperand(CurDAG->getTargetNode(Opc, VT, Node->getOperand(0)), 0);
1115         SDNode *ResNode = CurDAG->getTargetNode(Opc2, NVT, Tmp);
1116
1117 #ifndef NDEBUG
1118         DEBUG(std::cerr << std::string(Indent-2, ' '));
1119         DEBUG(std::cerr << "=> ");
1120         DEBUG(ResNode->dump(CurDAG));
1121         DEBUG(std::cerr << "\n");
1122         Indent -= 2;
1123 #endif
1124         return ResNode;
1125       }
1126
1127       break;
1128     }
1129   }
1130
1131   SDNode *ResNode = SelectCode(N);
1132
1133 #ifndef NDEBUG
1134   DEBUG(std::cerr << std::string(Indent-2, ' '));
1135   DEBUG(std::cerr << "=> ");
1136   if (ResNode == NULL || ResNode == N.Val)
1137     DEBUG(N.Val->dump(CurDAG));
1138   else
1139     DEBUG(ResNode->dump(CurDAG));
1140   DEBUG(std::cerr << "\n");
1141   Indent -= 2;
1142 #endif
1143
1144   return ResNode;
1145 }
1146
1147 bool X86DAGToDAGISel::
1148 SelectInlineAsmMemoryOperand(const SDOperand &Op, char ConstraintCode,
1149                              std::vector<SDOperand> &OutOps, SelectionDAG &DAG){
1150   SDOperand Op0, Op1, Op2, Op3;
1151   switch (ConstraintCode) {
1152   case 'o':   // offsetable        ??
1153   case 'v':   // not offsetable    ??
1154   default: return true;
1155   case 'm':   // memory
1156     if (!SelectAddr(Op, Op0, Op1, Op2, Op3))
1157       return true;
1158     break;
1159   }
1160
1161   OutOps.push_back(Op0);
1162   OutOps.push_back(Op1);
1163   OutOps.push_back(Op2);
1164   OutOps.push_back(Op3);
1165   AddToISelQueue(Op0);
1166   AddToISelQueue(Op1);
1167   AddToISelQueue(Op2);
1168   AddToISelQueue(Op3);
1169   return false;
1170 }
1171
1172 /// createX86ISelDag - This pass converts a legalized DAG into a
1173 /// X86-specific DAG, ready for instruction scheduling.
1174 ///
1175 FunctionPass *llvm::createX86ISelDag(X86TargetMachine &TM, bool Fast) {
1176   return new X86DAGToDAGISel(TM, Fast);
1177 }