1 //===-- PPC64ISelPattern.cpp - A pattern matching inst selector for PPC64 -===//
3 // The LLVM Compiler Infrastructure
5 // This file was developed by Nate Begeman and is distributed under
6 // the University of Illinois Open Source License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file defines a pattern matching instruction selector for 64 bit PowerPC.
12 //===----------------------------------------------------------------------===//
15 #include "PowerPCInstrBuilder.h"
16 #include "PowerPCInstrInfo.h"
17 #include "PPC64RegisterInfo.h"
18 #include "llvm/Constants.h" // FIXME: REMOVE
19 #include "llvm/Function.h"
20 #include "llvm/CodeGen/MachineConstantPool.h" // FIXME: REMOVE
21 #include "llvm/CodeGen/MachineFunction.h"
22 #include "llvm/CodeGen/MachineFrameInfo.h"
23 #include "llvm/CodeGen/SelectionDAG.h"
24 #include "llvm/CodeGen/SelectionDAGISel.h"
25 #include "llvm/CodeGen/SSARegMap.h"
26 #include "llvm/Target/TargetData.h"
27 #include "llvm/Target/TargetLowering.h"
28 #include "llvm/Target/TargetOptions.h"
29 #include "llvm/Support/Debug.h"
30 #include "llvm/Support/MathExtras.h"
31 #include "llvm/ADT/Statistic.h"
36 //===----------------------------------------------------------------------===//
37 // PPC32TargetLowering - PPC32 Implementation of the TargetLowering interface
39 class PPC64TargetLowering : public TargetLowering {
40 int VarArgsFrameIndex; // FrameIndex for start of varargs area.
41 int ReturnAddrIndex; // FrameIndex for return slot.
43 PPC64TargetLowering(TargetMachine &TM) : TargetLowering(TM) {
44 // Set up the register classes.
45 addRegisterClass(MVT::i64, PPC64::GPRCRegisterClass);
46 addRegisterClass(MVT::f32, PPC64::FPRCRegisterClass);
47 addRegisterClass(MVT::f64, PPC64::FPRCRegisterClass);
49 // PowerPC has no intrinsics for these particular operations
50 setOperationAction(ISD::BRCONDTWOWAY, MVT::Other, Expand);
51 setOperationAction(ISD::MEMMOVE, MVT::Other, Expand);
52 setOperationAction(ISD::MEMSET, MVT::Other, Expand);
53 setOperationAction(ISD::MEMCPY, MVT::Other, Expand);
55 // We don't support sin/cos/sqrt
56 setOperationAction(ISD::FSIN , MVT::f64, Expand);
57 setOperationAction(ISD::FCOS , MVT::f64, Expand);
58 setOperationAction(ISD::FSQRT, MVT::f64, Expand);
59 setOperationAction(ISD::FSIN , MVT::f32, Expand);
60 setOperationAction(ISD::FCOS , MVT::f32, Expand);
61 setOperationAction(ISD::FSQRT, MVT::f32, Expand);
63 // PPC 64 has i16 and i32 but no i8 (or i1) SEXTLOAD
64 setOperationAction(ISD::SEXTLOAD, MVT::i1, Expand);
65 setOperationAction(ISD::SEXTLOAD, MVT::i8, Expand);
67 // PowerPC has no SREM/UREM instructions
68 setOperationAction(ISD::SREM, MVT::i64, Expand);
69 setOperationAction(ISD::UREM, MVT::i64, Expand);
71 // PowerPC has these, but they are not implemented
72 setOperationAction(ISD::CTPOP, MVT::i64, Expand);
73 setOperationAction(ISD::CTTZ , MVT::i64, Expand);
74 setOperationAction(ISD::CTLZ , MVT::i64, Expand);
76 setShiftAmountFlavor(Extend); // shl X, 32 == 0
77 addLegalFPImmediate(+0.0); // Necessary for FSEL
78 addLegalFPImmediate(-0.0); //
80 computeRegisterProperties();
83 /// LowerArguments - This hook must be implemented to indicate how we should
84 /// lower the arguments for the specified function, into the specified DAG.
85 virtual std::vector<SDOperand>
86 LowerArguments(Function &F, SelectionDAG &DAG);
88 /// LowerCallTo - This hook lowers an abstract call to a function into an
90 virtual std::pair<SDOperand, SDOperand>
91 LowerCallTo(SDOperand Chain, const Type *RetTy, bool isVarArg,
92 SDOperand Callee, ArgListTy &Args, SelectionDAG &DAG);
94 virtual std::pair<SDOperand, SDOperand>
95 LowerVAStart(SDOperand Chain, SelectionDAG &DAG);
97 virtual std::pair<SDOperand,SDOperand>
98 LowerVAArgNext(bool isVANext, SDOperand Chain, SDOperand VAList,
99 const Type *ArgTy, SelectionDAG &DAG);
101 virtual std::pair<SDOperand, SDOperand>
102 LowerFrameReturnAddress(bool isFrameAddr, SDOperand Chain, unsigned Depth,
108 std::vector<SDOperand>
109 PPC64TargetLowering::LowerArguments(Function &F, SelectionDAG &DAG) {
111 // add beautiful description of PPC stack frame format, or at least some docs
113 MachineFunction &MF = DAG.getMachineFunction();
114 MachineFrameInfo *MFI = MF.getFrameInfo();
115 MachineBasicBlock& BB = MF.front();
116 std::vector<SDOperand> ArgValues;
118 // Due to the rather complicated nature of the PowerPC ABI, rather than a
119 // fixed size array of physical args, for the sake of simplicity let the STL
120 // handle tracking them for us.
121 std::vector<unsigned> argVR, argPR, argOp;
122 unsigned ArgOffset = 48;
123 unsigned GPR_remaining = 8;
124 unsigned FPR_remaining = 13;
125 unsigned GPR_idx = 0, FPR_idx = 0;
126 static const unsigned GPR[] = {
127 PPC::R3, PPC::R4, PPC::R5, PPC::R6,
128 PPC::R7, PPC::R8, PPC::R9, PPC::R10,
130 static const unsigned FPR[] = {
131 PPC::F1, PPC::F2, PPC::F3, PPC::F4, PPC::F5, PPC::F6, PPC::F7,
132 PPC::F8, PPC::F9, PPC::F10, PPC::F11, PPC::F12, PPC::F13
135 // Add DAG nodes to load the arguments... On entry to a function on PPC,
136 // the arguments start at offset 48, although they are likely to be passed
138 for (Function::arg_iterator I = F.arg_begin(), E = F.arg_end(); I != E; ++I) {
139 SDOperand newroot, argt;
140 bool needsLoad = false;
141 MVT::ValueType ObjectVT = getValueType(I->getType());
144 default: assert(0 && "Unhandled argument type!");
150 if (GPR_remaining > 0) {
151 BuildMI(&BB, PPC::IMPLICIT_DEF, 0, GPR[GPR_idx]);
152 argt = newroot = DAG.getCopyFromReg(GPR[GPR_idx], MVT::i32,
154 if (ObjectVT != MVT::i64)
155 argt = DAG.getNode(ISD::TRUNCATE, ObjectVT, newroot);
162 if (FPR_remaining > 0) {
163 BuildMI(&BB, PPC::IMPLICIT_DEF, 0, FPR[FPR_idx]);
164 argt = newroot = DAG.getCopyFromReg(FPR[FPR_idx], ObjectVT,
174 // We need to load the argument to a virtual register if we determined above
175 // that we ran out of physical registers of the appropriate type
177 unsigned SubregOffset = 0;
179 default: assert(0 && "Unhandled argument type!");
181 case MVT::i8: SubregOffset = 7; break;
182 case MVT::i16: SubregOffset = 6; break;
184 case MVT::f32: SubregOffset = 4; break;
186 case MVT::f64: SubregOffset = 0; break;
188 int FI = MFI->CreateFixedObject(8, ArgOffset);
189 SDOperand FIN = DAG.getFrameIndex(FI, MVT::i64);
190 FIN = DAG.getNode(ISD::ADD, MVT::i64, FIN,
191 DAG.getConstant(SubregOffset, MVT::i64));
192 argt = newroot = DAG.getLoad(ObjectVT, DAG.getEntryNode(), FIN, DAG.getSrcValue(NULL));
195 // Every 4 bytes of argument space consumes one of the GPRs available for
197 if (GPR_remaining > 0) {
203 DAG.setRoot(newroot.getValue(1));
204 ArgValues.push_back(argt);
207 // If the function takes variable number of arguments, make a frame index for
208 // the start of the first vararg value... for expansion of llvm.va_start.
210 VarArgsFrameIndex = MFI->CreateFixedObject(8, ArgOffset);
211 SDOperand FIN = DAG.getFrameIndex(VarArgsFrameIndex, MVT::i64);
212 // If this function is vararg, store any remaining integer argument regs
213 // to their spots on the stack so that they may be loaded by deferencing the
214 // result of va_next.
215 std::vector<SDOperand> MemOps;
216 for (; GPR_remaining > 0; --GPR_remaining, ++GPR_idx) {
217 BuildMI(&BB, PPC::IMPLICIT_DEF, 0, GPR[GPR_idx]);
218 SDOperand Val = DAG.getCopyFromReg(GPR[GPR_idx], MVT::i64, DAG.getRoot());
219 SDOperand Store = DAG.getNode(ISD::STORE, MVT::Other, Val.getValue(1),
220 Val, FIN, DAG.getSrcValue(NULL));
221 MemOps.push_back(Store);
222 // Increment the address by eight for the next argument to store
223 SDOperand PtrOff = DAG.getConstant(8, getPointerTy());
224 FIN = DAG.getNode(ISD::ADD, MVT::i32, FIN, PtrOff);
226 DAG.setRoot(DAG.getNode(ISD::TokenFactor, MVT::Other, MemOps));
232 std::pair<SDOperand, SDOperand>
233 PPC64TargetLowering::LowerCallTo(SDOperand Chain,
234 const Type *RetTy, bool isVarArg,
235 SDOperand Callee, ArgListTy &Args,
237 // args_to_use will accumulate outgoing args for the ISD::CALL case in
238 // SelectExpr to use to put the arguments in the appropriate registers.
239 std::vector<SDOperand> args_to_use;
241 // Count how many bytes are to be pushed on the stack, including the linkage
242 // area, and parameter passing area.
243 unsigned NumBytes = 48;
246 Chain = DAG.getNode(ISD::ADJCALLSTACKDOWN, MVT::Other, Chain,
247 DAG.getConstant(NumBytes, getPointerTy()));
249 NumBytes = 8 * Args.size(); // All arguments are rounded up to 8 bytes
251 // Just to be safe, we'll always reserve the full 48 bytes of linkage area
252 // plus 64 bytes of argument space in case any called code gets funky on us.
253 if (NumBytes < 112) NumBytes = 112;
255 // Adjust the stack pointer for the new arguments...
256 // These operations are automatically eliminated by the prolog/epilog pass
257 Chain = DAG.getNode(ISD::ADJCALLSTACKDOWN, MVT::Other, Chain,
258 DAG.getConstant(NumBytes, getPointerTy()));
260 // Set up a copy of the stack pointer for use loading and storing any
261 // arguments that may not fit in the registers available for argument
263 SDOperand StackPtr = DAG.getCopyFromReg(PPC::R1, MVT::i32,
266 // Figure out which arguments are going to go in registers, and which in
267 // memory. Also, if this is a vararg function, floating point operations
268 // must be stored to our stack, and loaded into integer regs as well, if
269 // any integer regs are available for argument passing.
270 unsigned ArgOffset = 48;
271 unsigned GPR_remaining = 8;
272 unsigned FPR_remaining = 13;
274 std::vector<SDOperand> MemOps;
275 for (unsigned i = 0, e = Args.size(); i != e; ++i) {
276 // PtrOff will be used to store the current argument to the stack if a
277 // register cannot be found for it.
278 SDOperand PtrOff = DAG.getConstant(ArgOffset, getPointerTy());
279 PtrOff = DAG.getNode(ISD::ADD, MVT::i32, StackPtr, PtrOff);
280 MVT::ValueType ArgVT = getValueType(Args[i].second);
283 default: assert(0 && "Unexpected ValueType for argument!");
288 // Promote the integer to 64 bits. If the input type is signed use a
289 // sign extend, otherwise use a zero extend.
290 if (Args[i].second->isSigned())
291 Args[i].first =DAG.getNode(ISD::SIGN_EXTEND, MVT::i64, Args[i].first);
293 Args[i].first =DAG.getNode(ISD::ZERO_EXTEND, MVT::i64, Args[i].first);
296 if (GPR_remaining > 0) {
297 args_to_use.push_back(Args[i].first);
300 MemOps.push_back(DAG.getNode(ISD::STORE, MVT::Other, Chain,
301 Args[i].first, PtrOff, DAG.getSrcValue(NULL)));
307 if (FPR_remaining > 0) {
308 args_to_use.push_back(Args[i].first);
311 SDOperand Store = DAG.getNode(ISD::STORE, MVT::Other, Chain,
312 Args[i].first, PtrOff, DAG.getSrcValue(NULL));
313 MemOps.push_back(Store);
314 // Float varargs are always shadowed in available integer registers
315 if (GPR_remaining > 0) {
316 SDOperand Load = DAG.getLoad(MVT::i64, Store, PtrOff, DAG.getSrcValue(NULL));
317 MemOps.push_back(Load);
318 args_to_use.push_back(Load);
322 // If we have any FPRs remaining, we may also have GPRs remaining.
323 // Args passed in FPRs also consume an available GPR.
324 if (GPR_remaining > 0) {
325 args_to_use.push_back(DAG.getNode(ISD::UNDEF, MVT::i64));
330 MemOps.push_back(DAG.getNode(ISD::STORE, MVT::Other, Chain,
331 Args[i].first, PtrOff, DAG.getSrcValue(NULL)));
338 Chain = DAG.getNode(ISD::TokenFactor, MVT::Other, MemOps);
341 std::vector<MVT::ValueType> RetVals;
342 MVT::ValueType RetTyVT = getValueType(RetTy);
343 if (RetTyVT != MVT::isVoid)
344 RetVals.push_back(RetTyVT);
345 RetVals.push_back(MVT::Other);
347 SDOperand TheCall = SDOperand(DAG.getCall(RetVals,
348 Chain, Callee, args_to_use), 0);
349 Chain = TheCall.getValue(RetTyVT != MVT::isVoid);
350 Chain = DAG.getNode(ISD::ADJCALLSTACKUP, MVT::Other, Chain,
351 DAG.getConstant(NumBytes, getPointerTy()));
352 return std::make_pair(TheCall, Chain);
355 std::pair<SDOperand, SDOperand>
356 PPC64TargetLowering::LowerVAStart(SDOperand Chain, SelectionDAG &DAG) {
357 //vastart just returns the address of the VarArgsFrameIndex slot.
358 return std::make_pair(DAG.getFrameIndex(VarArgsFrameIndex, MVT::i64), Chain);
361 std::pair<SDOperand,SDOperand> PPC64TargetLowering::
362 LowerVAArgNext(bool isVANext, SDOperand Chain, SDOperand VAList,
363 const Type *ArgTy, SelectionDAG &DAG) {
364 MVT::ValueType ArgVT = getValueType(ArgTy);
367 Result = DAG.getLoad(ArgVT, DAG.getEntryNode(), VAList, DAG.getSrcValue(NULL));
369 Result = DAG.getNode(ISD::ADD, VAList.getValueType(), VAList,
370 DAG.getConstant(8, VAList.getValueType()));
372 return std::make_pair(Result, Chain);
376 std::pair<SDOperand, SDOperand> PPC64TargetLowering::
377 LowerFrameReturnAddress(bool isFrameAddress, SDOperand Chain, unsigned Depth,
379 assert(0 && "LowerFrameReturnAddress unimplemented");
384 Statistic<>NotLogic("ppc-codegen", "Number of inverted logical ops");
385 Statistic<>FusedFP("ppc-codegen", "Number of fused fp operations");
386 //===--------------------------------------------------------------------===//
387 /// ISel - PPC32 specific code to select PPC32 machine instructions for
388 /// SelectionDAG operations.
389 //===--------------------------------------------------------------------===//
390 class ISel : public SelectionDAGISel {
393 PPC64TargetLowering PPC64Lowering;
395 /// ExprMap - As shared expressions are codegen'd, we keep track of which
396 /// vreg the value is produced in, so we only emit one copy of each compiled
398 std::map<SDOperand, unsigned> ExprMap;
400 unsigned GlobalBaseReg;
401 bool GlobalBaseInitialized;
404 ISel(TargetMachine &TM) : SelectionDAGISel(PPC64Lowering), PPC64Lowering(TM)
407 /// runOnFunction - Override this function in order to reset our per-function
409 virtual bool runOnFunction(Function &Fn) {
410 // Make sure we re-emit a set of the global base reg if necessary
411 GlobalBaseInitialized = false;
412 return SelectionDAGISel::runOnFunction(Fn);
415 /// InstructionSelectBasicBlock - This callback is invoked by
416 /// SelectionDAGISel when it has created a SelectionDAG for us to codegen.
417 virtual void InstructionSelectBasicBlock(SelectionDAG &DAG) {
419 // Codegen the basic block.
420 Select(DAG.getRoot());
422 // Clear state used for selection.
426 unsigned getGlobalBaseReg();
427 unsigned getConstDouble(double floatVal, unsigned Result);
428 unsigned SelectSetCR0(SDOperand CC);
429 unsigned SelectExpr(SDOperand N);
430 unsigned SelectExprFP(SDOperand N, unsigned Result);
431 void Select(SDOperand N);
433 bool SelectAddr(SDOperand N, unsigned& Reg, int& offset);
434 void SelectBranchCC(SDOperand N);
437 /// ExactLog2 - This function solves for (Val == 1 << (N-1)) and returns N. It
438 /// returns zero when the input is not exactly a power of two.
439 static unsigned ExactLog2(unsigned Val) {
440 if (Val == 0 || (Val & (Val-1))) return 0;
449 /// getImmediateForOpcode - This method returns a value indicating whether
450 /// the ConstantSDNode N can be used as an immediate to Opcode. The return
451 /// values are either 0, 1 or 2. 0 indicates that either N is not a
452 /// ConstantSDNode, or is not suitable for use by that opcode. A return value
453 /// of 1 indicates that the constant may be used in normal immediate form. A
454 /// return value of 2 indicates that the constant may be used in shifted
455 /// immediate form. A return value of 3 indicates that log base 2 of the
456 /// constant may be used.
458 static unsigned getImmediateForOpcode(SDOperand N, unsigned Opcode,
459 unsigned& Imm, bool U = false) {
460 if (N.getOpcode() != ISD::Constant) return 0;
462 int v = (int)cast<ConstantSDNode>(N)->getSignExtended();
467 if (v <= 32767 && v >= -32768) { Imm = v & 0xFFFF; return 1; }
468 if ((v & 0x0000FFFF) == 0) { Imm = v >> 16; return 2; }
473 if (v >= 0 && v <= 65535) { Imm = v & 0xFFFF; return 1; }
474 if ((v & 0x0000FFFF) == 0) { Imm = v >> 16; return 2; }
478 if (v <= 32767 && v >= -32768) { Imm = v & 0xFFFF; return 1; }
481 if (U && (v >= 0 && v <= 65535)) { Imm = v & 0xFFFF; return 1; }
482 if (!U && (v <= 32767 && v >= -32768)) { Imm = v & 0xFFFF; return 1; }
485 if ((Imm = ExactLog2(v))) { return 3; }
491 /// getBCCForSetCC - Returns the PowerPC condition branch mnemonic corresponding
492 /// to Condition. If the Condition is unordered or unsigned, the bool argument
493 /// U is set to true, otherwise it is set to false.
494 static unsigned getBCCForSetCC(unsigned Condition, bool& U) {
497 default: assert(0 && "Unknown condition!"); abort();
498 case ISD::SETEQ: return PPC::BEQ;
499 case ISD::SETNE: return PPC::BNE;
500 case ISD::SETULT: U = true;
501 case ISD::SETLT: return PPC::BLT;
502 case ISD::SETULE: U = true;
503 case ISD::SETLE: return PPC::BLE;
504 case ISD::SETUGT: U = true;
505 case ISD::SETGT: return PPC::BGT;
506 case ISD::SETUGE: U = true;
507 case ISD::SETGE: return PPC::BGE;
512 /// IndexedOpForOp - Return the indexed variant for each of the PowerPC load
513 /// and store immediate instructions.
514 static unsigned IndexedOpForOp(unsigned Opcode) {
516 default: assert(0 && "Unknown opcode!"); abort();
517 case PPC::LBZ: return PPC::LBZX; case PPC::STB: return PPC::STBX;
518 case PPC::LHZ: return PPC::LHZX; case PPC::STH: return PPC::STHX;
519 case PPC::LHA: return PPC::LHAX; case PPC::STW: return PPC::STWX;
520 case PPC::LWZ: return PPC::LWZX; case PPC::STD: return PPC::STDX;
521 case PPC::LD: return PPC::LDX; case PPC::STFS: return PPC::STFSX;
522 case PPC::LFS: return PPC::LFSX; case PPC::STFD: return PPC::STFDX;
523 case PPC::LFD: return PPC::LFDX;
529 /// getGlobalBaseReg - Output the instructions required to put the
530 /// base address to use for accessing globals into a register.
532 unsigned ISel::getGlobalBaseReg() {
533 if (!GlobalBaseInitialized) {
534 // Insert the set of GlobalBaseReg into the first MBB of the function
535 MachineBasicBlock &FirstMBB = BB->getParent()->front();
536 MachineBasicBlock::iterator MBBI = FirstMBB.begin();
537 GlobalBaseReg = MakeReg(MVT::i64);
538 BuildMI(FirstMBB, MBBI, PPC::MovePCtoLR, 0, PPC::LR);
539 BuildMI(FirstMBB, MBBI, PPC::MFLR, 1, GlobalBaseReg).addReg(PPC::LR);
540 GlobalBaseInitialized = true;
542 return GlobalBaseReg;
545 /// getConstDouble - Loads a floating point value into a register, via the
546 /// Constant Pool. Optionally takes a register in which to load the value.
547 unsigned ISel::getConstDouble(double doubleVal, unsigned Result=0) {
548 unsigned Tmp1 = MakeReg(MVT::i64);
549 if (0 == Result) Result = MakeReg(MVT::f64);
550 MachineConstantPool *CP = BB->getParent()->getConstantPool();
551 ConstantFP *CFP = ConstantFP::get(Type::DoubleTy, doubleVal);
552 unsigned CPI = CP->getConstantPoolIndex(CFP);
553 BuildMI(BB, PPC::LOADHiAddr, 2, Tmp1).addReg(getGlobalBaseReg())
554 .addConstantPoolIndex(CPI);
555 BuildMI(BB, PPC::LFD, 2, Result).addConstantPoolIndex(CPI).addReg(Tmp1);
559 unsigned ISel::SelectSetCR0(SDOperand CC) {
560 unsigned Opc, Tmp1, Tmp2;
561 static const unsigned CompareOpcodes[] =
562 { PPC::FCMPU, PPC::FCMPU, PPC::CMPW, PPC::CMPLW };
564 // If the first operand to the select is a SETCC node, then we can fold it
565 // into the branch that selects which value to return.
566 SetCCSDNode* SetCC = dyn_cast<SetCCSDNode>(CC.Val);
567 if (SetCC && CC.getOpcode() == ISD::SETCC) {
569 Opc = getBCCForSetCC(SetCC->getCondition(), U);
570 Tmp1 = SelectExpr(SetCC->getOperand(0));
572 // Pass the optional argument U to getImmediateForOpcode for SETCC,
573 // so that it knows whether the SETCC immediate range is signed or not.
574 if (1 == getImmediateForOpcode(SetCC->getOperand(1), ISD::SETCC,
577 BuildMI(BB, PPC::CMPLWI, 2, PPC::CR0).addReg(Tmp1).addImm(Tmp2);
579 BuildMI(BB, PPC::CMPWI, 2, PPC::CR0).addReg(Tmp1).addSImm(Tmp2);
581 bool IsInteger = MVT::isInteger(SetCC->getOperand(0).getValueType());
582 unsigned CompareOpc = CompareOpcodes[2 * IsInteger + U];
583 Tmp2 = SelectExpr(SetCC->getOperand(1));
584 BuildMI(BB, CompareOpc, 2, PPC::CR0).addReg(Tmp1).addReg(Tmp2);
587 Tmp1 = SelectExpr(CC);
588 BuildMI(BB, PPC::CMPLWI, 2, PPC::CR0).addReg(Tmp1).addImm(0);
594 /// Check to see if the load is a constant offset from a base register
595 bool ISel::SelectAddr(SDOperand N, unsigned& Reg, int& offset)
597 unsigned imm = 0, opcode = N.getOpcode();
598 if (N.getOpcode() == ISD::ADD) {
599 Reg = SelectExpr(N.getOperand(0));
600 if (1 == getImmediateForOpcode(N.getOperand(1), opcode, imm)) {
604 offset = SelectExpr(N.getOperand(1));
612 void ISel::SelectBranchCC(SDOperand N)
614 assert(N.getOpcode() == ISD::BRCOND && "Not a BranchCC???");
615 MachineBasicBlock *Dest =
616 cast<BasicBlockSDNode>(N.getOperand(2))->getBasicBlock();
618 // Get the MBB we will fall through to so that we can hand it off to the
619 // branch selection pass as an argument to the PPC::COND_BRANCH pseudo op.
620 //ilist<MachineBasicBlock>::iterator It = BB;
621 //MachineBasicBlock *Fallthrough = ++It;
623 Select(N.getOperand(0)); //chain
624 unsigned Opc = SelectSetCR0(N.getOperand(1));
625 // FIXME: Use this once we have something approximating two-way branches
626 // We cannot currently use this in case the ISel hands us something like
629 // since the fallthrough basic block for the conditional branch does not start
630 // with the unconditional branch (it is skipped over).
631 //BuildMI(BB, PPC::COND_BRANCH, 4).addReg(PPC::CR0).addImm(Opc)
632 // .addMBB(Dest).addMBB(Fallthrough);
633 BuildMI(BB, Opc, 2).addReg(PPC::CR0).addMBB(Dest);
637 unsigned ISel::SelectExprFP(SDOperand N, unsigned Result)
639 unsigned Tmp1, Tmp2, Tmp3;
641 SDNode *Node = N.Val;
642 MVT::ValueType DestType = N.getValueType();
643 unsigned opcode = N.getOpcode();
648 assert(0 && "Node not handled!\n");
651 // Attempt to generate FSEL. We can do this whenever we have an FP result,
652 // and an FP comparison in the SetCC node.
653 SetCCSDNode* SetCC = dyn_cast<SetCCSDNode>(N.getOperand(0).Val);
654 if (SetCC && N.getOperand(0).getOpcode() == ISD::SETCC &&
655 !MVT::isInteger(SetCC->getOperand(0).getValueType()) &&
656 SetCC->getCondition() != ISD::SETEQ &&
657 SetCC->getCondition() != ISD::SETNE) {
658 MVT::ValueType VT = SetCC->getOperand(0).getValueType();
659 Tmp1 = SelectExpr(SetCC->getOperand(0)); // Val to compare against
660 unsigned TV = SelectExpr(N.getOperand(1)); // Use if TRUE
661 unsigned FV = SelectExpr(N.getOperand(2)); // Use if FALSE
663 ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(SetCC->getOperand(1));
664 if (CN && (CN->isExactlyValue(-0.0) || CN->isExactlyValue(0.0))) {
665 switch(SetCC->getCondition()) {
666 default: assert(0 && "Invalid FSEL condition"); abort();
669 BuildMI(BB, PPC::FSEL, 3, Result).addReg(Tmp1).addReg(FV).addReg(TV);
673 BuildMI(BB, PPC::FSEL, 3, Result).addReg(Tmp1).addReg(TV).addReg(FV);
678 BuildMI(BB, PPC::FNEG, 1, Tmp2).addReg(Tmp1);
679 BuildMI(BB, PPC::FSEL, 3, Result).addReg(Tmp2).addReg(FV).addReg(TV);
685 BuildMI(BB, PPC::FNEG, 1, Tmp2).addReg(Tmp1);
686 BuildMI(BB, PPC::FSEL, 3, Result).addReg(Tmp2).addReg(TV).addReg(FV);
691 Opc = (MVT::f64 == VT) ? PPC::FSUB : PPC::FSUBS;
692 Tmp2 = SelectExpr(SetCC->getOperand(1));
694 switch(SetCC->getCondition()) {
695 default: assert(0 && "Invalid FSEL condition"); abort();
698 BuildMI(BB, Opc, 2, Tmp3).addReg(Tmp1).addReg(Tmp2);
699 BuildMI(BB, PPC::FSEL, 3, Result).addReg(Tmp3).addReg(FV).addReg(TV);
703 BuildMI(BB, Opc, 2, Tmp3).addReg(Tmp1).addReg(Tmp2);
704 BuildMI(BB, PPC::FSEL, 3, Result).addReg(Tmp3).addReg(TV).addReg(FV);
708 BuildMI(BB, Opc, 2, Tmp3).addReg(Tmp2).addReg(Tmp1);
709 BuildMI(BB, PPC::FSEL, 3, Result).addReg(Tmp3).addReg(FV).addReg(TV);
713 BuildMI(BB, Opc, 2, Tmp3).addReg(Tmp2).addReg(Tmp1);
714 BuildMI(BB, PPC::FSEL, 3, Result).addReg(Tmp3).addReg(TV).addReg(FV);
718 assert(0 && "Should never get here");
722 unsigned TrueValue = SelectExpr(N.getOperand(1)); //Use if TRUE
723 unsigned FalseValue = SelectExpr(N.getOperand(2)); //Use if FALSE
724 Opc = SelectSetCR0(N.getOperand(0));
726 // Create an iterator with which to insert the MBB for copying the false
727 // value and the MBB to hold the PHI instruction for this SetCC.
728 MachineBasicBlock *thisMBB = BB;
729 const BasicBlock *LLVM_BB = BB->getBasicBlock();
730 ilist<MachineBasicBlock>::iterator It = BB;
738 // fallthrough --> copy0MBB
739 MachineBasicBlock *copy0MBB = new MachineBasicBlock(LLVM_BB);
740 MachineBasicBlock *sinkMBB = new MachineBasicBlock(LLVM_BB);
741 BuildMI(BB, Opc, 2).addReg(PPC::CR0).addMBB(sinkMBB);
742 MachineFunction *F = BB->getParent();
743 F->getBasicBlockList().insert(It, copy0MBB);
744 F->getBasicBlockList().insert(It, sinkMBB);
745 // Update machine-CFG edges
746 BB->addSuccessor(copy0MBB);
747 BB->addSuccessor(sinkMBB);
751 // # fallthrough to sinkMBB
753 // Update machine-CFG edges
754 BB->addSuccessor(sinkMBB);
757 // %Result = phi [ %FalseValue, copy0MBB ], [ %TrueValue, thisMBB ]
760 BuildMI(BB, PPC::PHI, 4, Result).addReg(FalseValue)
761 .addMBB(copy0MBB).addReg(TrueValue).addMBB(thisMBB);
766 if (!NoExcessFPPrecision &&
767 ISD::ADD == N.getOperand(0).getOpcode() &&
768 N.getOperand(0).Val->hasOneUse() &&
769 ISD::MUL == N.getOperand(0).getOperand(0).getOpcode() &&
770 N.getOperand(0).getOperand(0).Val->hasOneUse()) {
771 ++FusedFP; // Statistic
772 Tmp1 = SelectExpr(N.getOperand(0).getOperand(0).getOperand(0));
773 Tmp2 = SelectExpr(N.getOperand(0).getOperand(0).getOperand(1));
774 Tmp3 = SelectExpr(N.getOperand(0).getOperand(1));
775 Opc = DestType == MVT::f64 ? PPC::FNMADD : PPC::FNMADDS;
776 BuildMI(BB, Opc, 3, Result).addReg(Tmp1).addReg(Tmp2).addReg(Tmp3);
777 } else if (!NoExcessFPPrecision &&
778 ISD::SUB == N.getOperand(0).getOpcode() &&
779 N.getOperand(0).Val->hasOneUse() &&
780 ISD::MUL == N.getOperand(0).getOperand(0).getOpcode() &&
781 N.getOperand(0).getOperand(0).Val->hasOneUse()) {
782 ++FusedFP; // Statistic
783 Tmp1 = SelectExpr(N.getOperand(0).getOperand(0).getOperand(0));
784 Tmp2 = SelectExpr(N.getOperand(0).getOperand(0).getOperand(1));
785 Tmp3 = SelectExpr(N.getOperand(0).getOperand(1));
786 Opc = DestType == MVT::f64 ? PPC::FNMSUB : PPC::FNMSUBS;
787 BuildMI(BB, Opc, 3, Result).addReg(Tmp1).addReg(Tmp2).addReg(Tmp3);
788 } else if (ISD::FABS == N.getOperand(0).getOpcode()) {
789 Tmp1 = SelectExpr(N.getOperand(0).getOperand(0));
790 BuildMI(BB, PPC::FNABS, 1, Result).addReg(Tmp1);
792 Tmp1 = SelectExpr(N.getOperand(0));
793 BuildMI(BB, PPC::FNEG, 1, Result).addReg(Tmp1);
798 Tmp1 = SelectExpr(N.getOperand(0));
799 BuildMI(BB, PPC::FABS, 1, Result).addReg(Tmp1);
803 assert (DestType == MVT::f32 &&
804 N.getOperand(0).getValueType() == MVT::f64 &&
805 "only f64 to f32 conversion supported here");
806 Tmp1 = SelectExpr(N.getOperand(0));
807 BuildMI(BB, PPC::FRSP, 1, Result).addReg(Tmp1);
811 assert (DestType == MVT::f64 &&
812 N.getOperand(0).getValueType() == MVT::f32 &&
813 "only f32 to f64 conversion supported here");
814 Tmp1 = SelectExpr(N.getOperand(0));
815 BuildMI(BB, PPC::FMR, 1, Result).addReg(Tmp1);
818 case ISD::CopyFromReg:
820 Result = ExprMap[N.getValue(0)] = MakeReg(N.getValue(0).getValueType());
821 Tmp1 = dyn_cast<RegSDNode>(Node)->getReg();
822 BuildMI(BB, PPC::FMR, 1, Result).addReg(Tmp1);
825 case ISD::ConstantFP: {
826 ConstantFPSDNode *CN = cast<ConstantFPSDNode>(N);
827 Result = getConstDouble(CN->getValue(), Result);
832 if (!NoExcessFPPrecision && N.getOperand(0).getOpcode() == ISD::MUL &&
833 N.getOperand(0).Val->hasOneUse()) {
834 ++FusedFP; // Statistic
835 Tmp1 = SelectExpr(N.getOperand(0).getOperand(0));
836 Tmp2 = SelectExpr(N.getOperand(0).getOperand(1));
837 Tmp3 = SelectExpr(N.getOperand(1));
838 Opc = DestType == MVT::f64 ? PPC::FMADD : PPC::FMADDS;
839 BuildMI(BB, Opc, 3, Result).addReg(Tmp1).addReg(Tmp2).addReg(Tmp3);
842 Opc = DestType == MVT::f64 ? PPC::FADD : PPC::FADDS;
843 Tmp1 = SelectExpr(N.getOperand(0));
844 Tmp2 = SelectExpr(N.getOperand(1));
845 BuildMI(BB, Opc, 2, Result).addReg(Tmp1).addReg(Tmp2);
849 if (!NoExcessFPPrecision && N.getOperand(0).getOpcode() == ISD::MUL &&
850 N.getOperand(0).Val->hasOneUse()) {
851 ++FusedFP; // Statistic
852 Tmp1 = SelectExpr(N.getOperand(0).getOperand(0));
853 Tmp2 = SelectExpr(N.getOperand(0).getOperand(1));
854 Tmp3 = SelectExpr(N.getOperand(1));
855 Opc = DestType == MVT::f64 ? PPC::FMSUB : PPC::FMSUBS;
856 BuildMI(BB, Opc, 3, Result).addReg(Tmp1).addReg(Tmp2).addReg(Tmp3);
859 Opc = DestType == MVT::f64 ? PPC::FSUB : PPC::FSUBS;
860 Tmp1 = SelectExpr(N.getOperand(0));
861 Tmp2 = SelectExpr(N.getOperand(1));
862 BuildMI(BB, Opc, 2, Result).addReg(Tmp1).addReg(Tmp2);
868 case ISD::MUL: Opc = DestType == MVT::f64 ? PPC::FMUL : PPC::FMULS; break;
869 case ISD::SDIV: Opc = DestType == MVT::f64 ? PPC::FDIV : PPC::FDIVS; break;
871 Tmp1 = SelectExpr(N.getOperand(0));
872 Tmp2 = SelectExpr(N.getOperand(1));
873 BuildMI(BB, Opc, 2, Result).addReg(Tmp1).addReg(Tmp2);
876 case ISD::UINT_TO_FP:
877 case ISD::SINT_TO_FP: {
878 bool IsUnsigned = (ISD::UINT_TO_FP == opcode);
879 Tmp1 = SelectExpr(N.getOperand(0)); // Get the operand register
880 Tmp2 = MakeReg(MVT::f64); // temp reg to load the integer value into
881 Tmp3 = MakeReg(MVT::i64); // temp reg to hold the conversion constant
882 unsigned ConstF = MakeReg(MVT::f64); // temp reg to hold the fp constant
884 int FrameIdx = BB->getParent()->getFrameInfo()->CreateStackObject(8, 8);
885 MachineConstantPool *CP = BB->getParent()->getConstantPool();
887 // FIXME: pull this FP constant generation stuff out into something like
888 // the simple ISel's getReg.
890 addFrameReference(BuildMI(BB, PPC::STD, 3).addReg(Tmp1), FrameIdx);
891 addFrameReference(BuildMI(BB, PPC::LFD, 2, Tmp2), FrameIdx);
892 BuildMI(BB, PPC::FCFID, 1, Result).addReg(Tmp2);
894 ConstantFP *CFP = ConstantFP::get(Type::DoubleTy, 0x1.000008p52);
895 unsigned CPI = CP->getConstantPoolIndex(CFP);
896 // Load constant fp value
897 unsigned Tmp4 = MakeReg(MVT::i32);
898 unsigned TmpL = MakeReg(MVT::i32);
899 BuildMI(BB, PPC::LOADHiAddr, 2, Tmp4).addReg(getGlobalBaseReg())
900 .addConstantPoolIndex(CPI);
901 BuildMI(BB, PPC::LFD, 2, ConstF).addConstantPoolIndex(CPI).addReg(Tmp4);
902 // Store the hi & low halves of the fp value, currently in int regs
903 BuildMI(BB, PPC::LIS, 1, Tmp3).addSImm(0x4330);
904 addFrameReference(BuildMI(BB, PPC::STW, 3).addReg(Tmp3), FrameIdx);
905 BuildMI(BB, PPC::XORIS, 2, TmpL).addReg(Tmp1).addImm(0x8000);
906 addFrameReference(BuildMI(BB, PPC::STW, 3).addReg(TmpL), FrameIdx, 4);
907 addFrameReference(BuildMI(BB, PPC::LFD, 2, Tmp2), FrameIdx);
908 // Generate the return value with a subtract
909 BuildMI(BB, PPC::FSUB, 2, Result).addReg(Tmp2).addReg(ConstF);
914 assert(0 && "Should never get here");
918 unsigned ISel::SelectExpr(SDOperand N) {
920 unsigned Tmp1, Tmp2, Tmp3;
922 unsigned opcode = N.getOpcode();
924 SDNode *Node = N.Val;
925 MVT::ValueType DestType = N.getValueType();
927 unsigned &Reg = ExprMap[N];
930 switch (N.getOpcode()) {
932 Reg = Result = (N.getValueType() != MVT::Other) ?
933 MakeReg(N.getValueType()) : 1;
936 // If this is a call instruction, make sure to prepare ALL of the result
937 // values as well as the chain.
938 if (Node->getNumValues() == 1)
939 Reg = Result = 1; // Void call, just a chain.
941 Result = MakeReg(Node->getValueType(0));
942 ExprMap[N.getValue(0)] = Result;
943 for (unsigned i = 1, e = N.Val->getNumValues()-1; i != e; ++i)
944 ExprMap[N.getValue(i)] = MakeReg(Node->getValueType(i));
945 ExprMap[SDOperand(Node, Node->getNumValues()-1)] = 1;
950 if (ISD::CopyFromReg == opcode)
951 DestType = N.getValue(0).getValueType();
953 if (DestType == MVT::f64 || DestType == MVT::f32)
954 if (ISD::LOAD != opcode && ISD::EXTLOAD != opcode && ISD::UNDEF != opcode)
955 return SelectExprFP(N, Result);
960 assert(0 && "Node not handled!\n");
962 BuildMI(BB, PPC::IMPLICIT_DEF, 0, Result);
964 case ISD::DYNAMIC_STACKALLOC:
965 // Generate both result values. FIXME: Need a better commment here?
967 ExprMap[N.getValue(1)] = 1;
969 Result = ExprMap[N.getValue(0)] = MakeReg(N.getValue(0).getValueType());
971 // FIXME: We are currently ignoring the requested alignment for handling
972 // greater than the stack alignment. This will need to be revisited at some
973 // point. Align = N.getOperand(2);
974 if (!isa<ConstantSDNode>(N.getOperand(2)) ||
975 cast<ConstantSDNode>(N.getOperand(2))->getValue() != 0) {
976 std::cerr << "Cannot allocate stack object with greater alignment than"
977 << " the stack alignment yet!";
980 Select(N.getOperand(0));
981 Tmp1 = SelectExpr(N.getOperand(1));
982 // Subtract size from stack pointer, thereby allocating some space.
983 BuildMI(BB, PPC::SUBF, 2, PPC::R1).addReg(Tmp1).addReg(PPC::R1);
984 // Put a pointer to the space into the result register by copying the SP
985 BuildMI(BB, PPC::OR, 2, Result).addReg(PPC::R1).addReg(PPC::R1);
988 case ISD::ConstantPool:
989 Tmp1 = cast<ConstantPoolSDNode>(N)->getIndex();
990 Tmp2 = MakeReg(MVT::i64);
991 BuildMI(BB, PPC::LOADHiAddr, 2, Tmp2).addReg(getGlobalBaseReg())
992 .addConstantPoolIndex(Tmp1);
993 BuildMI(BB, PPC::LA, 2, Result).addReg(Tmp2).addConstantPoolIndex(Tmp1);
996 case ISD::FrameIndex:
997 Tmp1 = cast<FrameIndexSDNode>(N)->getIndex();
998 addFrameReference(BuildMI(BB, PPC::ADDI, 2, Result), (int)Tmp1, 0, false);
1001 case ISD::GlobalAddress: {
1002 GlobalValue *GV = cast<GlobalAddressSDNode>(N)->getGlobal();
1003 Tmp1 = MakeReg(MVT::i64);
1004 BuildMI(BB, PPC::LOADHiAddr, 2, Tmp1).addReg(getGlobalBaseReg())
1005 .addGlobalAddress(GV);
1006 if (GV->hasWeakLinkage() || GV->isExternal()) {
1007 BuildMI(BB, PPC::LD, 2, Result).addGlobalAddress(GV).addReg(Tmp1);
1009 BuildMI(BB, PPC::LA, 2, Result).addReg(Tmp1).addGlobalAddress(GV);
1017 case ISD::SEXTLOAD: {
1018 MVT::ValueType TypeBeingLoaded = (ISD::LOAD == opcode) ?
1019 Node->getValueType(0) : cast<MVTSDNode>(Node)->getExtraValueType();
1020 bool sext = (ISD::SEXTLOAD == opcode);
1022 // Make sure we generate both values.
1024 ExprMap[N.getValue(1)] = 1; // Generate the token
1026 Result = ExprMap[N.getValue(0)] = MakeReg(N.getValue(0).getValueType());
1028 SDOperand Chain = N.getOperand(0);
1029 SDOperand Address = N.getOperand(1);
1032 switch (TypeBeingLoaded) {
1033 default: Node->dump(); assert(0 && "Cannot load this type!");
1034 case MVT::i1: Opc = PPC::LBZ; break;
1035 case MVT::i8: Opc = PPC::LBZ; break;
1036 case MVT::i16: Opc = sext ? PPC::LHA : PPC::LHZ; break;
1037 case MVT::i32: Opc = sext ? PPC::LWA : PPC::LWZ; break;
1038 case MVT::i64: Opc = PPC::LD; break;
1039 case MVT::f32: Opc = PPC::LFS; break;
1040 case MVT::f64: Opc = PPC::LFD; break;
1043 if (ConstantPoolSDNode *CP = dyn_cast<ConstantPoolSDNode>(Address)) {
1044 Tmp1 = MakeReg(MVT::i64);
1045 int CPI = CP->getIndex();
1046 BuildMI(BB, PPC::LOADHiAddr, 2, Tmp1).addReg(getGlobalBaseReg())
1047 .addConstantPoolIndex(CPI);
1048 BuildMI(BB, Opc, 2, Result).addConstantPoolIndex(CPI).addReg(Tmp1);
1050 else if(Address.getOpcode() == ISD::FrameIndex) {
1051 Tmp1 = cast<FrameIndexSDNode>(Address)->getIndex();
1052 addFrameReference(BuildMI(BB, Opc, 2, Result), (int)Tmp1);
1055 bool idx = SelectAddr(Address, Tmp1, offset);
1057 Opc = IndexedOpForOp(Opc);
1058 BuildMI(BB, Opc, 2, Result).addReg(Tmp1).addReg(offset);
1060 BuildMI(BB, Opc, 2, Result).addSImm(offset).addReg(Tmp1);
1067 unsigned GPR_idx = 0, FPR_idx = 0;
1068 static const unsigned GPR[] = {
1069 PPC::R3, PPC::R4, PPC::R5, PPC::R6,
1070 PPC::R7, PPC::R8, PPC::R9, PPC::R10,
1072 static const unsigned FPR[] = {
1073 PPC::F1, PPC::F2, PPC::F3, PPC::F4, PPC::F5, PPC::F6, PPC::F7,
1074 PPC::F8, PPC::F9, PPC::F10, PPC::F11, PPC::F12, PPC::F13
1077 // Lower the chain for this call.
1078 Select(N.getOperand(0));
1079 ExprMap[N.getValue(Node->getNumValues()-1)] = 1;
1081 MachineInstr *CallMI;
1082 // Emit the correct call instruction based on the type of symbol called.
1083 if (GlobalAddressSDNode *GASD =
1084 dyn_cast<GlobalAddressSDNode>(N.getOperand(1))) {
1085 CallMI = BuildMI(PPC::CALLpcrel, 1).addGlobalAddress(GASD->getGlobal(),
1087 } else if (ExternalSymbolSDNode *ESSDN =
1088 dyn_cast<ExternalSymbolSDNode>(N.getOperand(1))) {
1089 CallMI = BuildMI(PPC::CALLpcrel, 1).addExternalSymbol(ESSDN->getSymbol(),
1092 Tmp1 = SelectExpr(N.getOperand(1));
1093 BuildMI(BB, PPC::OR, 2, PPC::R12).addReg(Tmp1).addReg(Tmp1);
1094 BuildMI(BB, PPC::MTCTR, 1).addReg(PPC::R12);
1095 CallMI = BuildMI(PPC::CALLindirect, 3).addImm(20).addImm(0)
1099 // Load the register args to virtual regs
1100 std::vector<unsigned> ArgVR;
1101 for(int i = 2, e = Node->getNumOperands(); i < e; ++i)
1102 ArgVR.push_back(SelectExpr(N.getOperand(i)));
1104 // Copy the virtual registers into the appropriate argument register
1105 for(int i = 0, e = ArgVR.size(); i < e; ++i) {
1106 switch(N.getOperand(i+2).getValueType()) {
1107 default: Node->dump(); assert(0 && "Unknown value type for call");
1113 assert(GPR_idx < 8 && "Too many int args");
1114 if (N.getOperand(i+2).getOpcode() != ISD::UNDEF) {
1115 BuildMI(BB, PPC::OR,2,GPR[GPR_idx]).addReg(ArgVR[i]).addReg(ArgVR[i]);
1116 CallMI->addRegOperand(GPR[GPR_idx], MachineOperand::Use);
1122 assert(FPR_idx < 13 && "Too many fp args");
1123 BuildMI(BB, PPC::FMR, 1, FPR[FPR_idx]).addReg(ArgVR[i]);
1124 CallMI->addRegOperand(FPR[FPR_idx], MachineOperand::Use);
1130 // Put the call instruction in the correct place in the MachineBasicBlock
1131 BB->push_back(CallMI);
1133 switch (Node->getValueType(0)) {
1134 default: assert(0 && "Unknown value type for call result!");
1135 case MVT::Other: return 1;
1141 BuildMI(BB, PPC::OR, 2, Result).addReg(PPC::R3).addReg(PPC::R3);
1145 BuildMI(BB, PPC::FMR, 1, Result).addReg(PPC::F1);
1148 return Result+N.ResNo;
1151 case ISD::SIGN_EXTEND:
1152 case ISD::SIGN_EXTEND_INREG:
1153 Tmp1 = SelectExpr(N.getOperand(0));
1154 switch(cast<MVTSDNode>(Node)->getExtraValueType()) {
1155 default: Node->dump(); assert(0 && "Unhandled SIGN_EXTEND type"); break;
1157 BuildMI(BB, PPC::EXTSW, 1, Result).addReg(Tmp1);
1160 BuildMI(BB, PPC::EXTSH, 1, Result).addReg(Tmp1);
1163 BuildMI(BB, PPC::EXTSB, 1, Result).addReg(Tmp1);
1166 BuildMI(BB, PPC::SUBFIC, 2, Result).addReg(Tmp1).addSImm(0);
1171 case ISD::CopyFromReg:
1173 Result = ExprMap[N.getValue(0)] = MakeReg(N.getValue(0).getValueType());
1174 Tmp1 = dyn_cast<RegSDNode>(Node)->getReg();
1175 BuildMI(BB, PPC::OR, 2, Result).addReg(Tmp1).addReg(Tmp1);
1179 Tmp1 = SelectExpr(N.getOperand(0));
1180 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N.getOperand(1))) {
1181 Tmp2 = CN->getValue() & 0x3F;
1182 BuildMI(BB, PPC::RLDICR, 3, Result).addReg(Tmp1).addImm(Tmp2)
1185 Tmp2 = SelectExpr(N.getOperand(1));
1186 BuildMI(BB, PPC::SLD, 2, Result).addReg(Tmp1).addReg(Tmp2);
1191 Tmp1 = SelectExpr(N.getOperand(0));
1192 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N.getOperand(1))) {
1193 Tmp2 = CN->getValue() & 0x3F;
1194 BuildMI(BB, PPC::RLDICL, 3, Result).addReg(Tmp1).addImm(64-Tmp2)
1197 Tmp2 = SelectExpr(N.getOperand(1));
1198 BuildMI(BB, PPC::SRD, 2, Result).addReg(Tmp1).addReg(Tmp2);
1203 Tmp1 = SelectExpr(N.getOperand(0));
1204 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N.getOperand(1))) {
1205 Tmp2 = CN->getValue() & 0x3F;
1206 BuildMI(BB, PPC::SRADI, 2, Result).addReg(Tmp1).addImm(Tmp2);
1208 Tmp2 = SelectExpr(N.getOperand(1));
1209 BuildMI(BB, PPC::SRAD, 2, Result).addReg(Tmp1).addReg(Tmp2);
1214 Tmp1 = SelectExpr(N.getOperand(0));
1215 switch(getImmediateForOpcode(N.getOperand(1), opcode, Tmp2)) {
1216 default: assert(0 && "unhandled result code");
1217 case 0: // No immediate
1218 Tmp2 = SelectExpr(N.getOperand(1));
1219 BuildMI(BB, PPC::ADD, 2, Result).addReg(Tmp1).addReg(Tmp2);
1221 case 1: // Low immediate
1222 BuildMI(BB, PPC::ADDI, 2, Result).addReg(Tmp1).addSImm(Tmp2);
1224 case 2: // Shifted immediate
1225 BuildMI(BB, PPC::ADDIS, 2, Result).addReg(Tmp1).addSImm(Tmp2);
1232 Tmp1 = SelectExpr(N.getOperand(0));
1233 switch(getImmediateForOpcode(N.getOperand(1), opcode, Tmp2)) {
1234 default: assert(0 && "unhandled result code");
1235 case 0: // No immediate
1236 Tmp2 = SelectExpr(N.getOperand(1));
1238 case ISD::AND: Opc = PPC::AND; break;
1239 case ISD::OR: Opc = PPC::OR; break;
1241 BuildMI(BB, Opc, 2, Result).addReg(Tmp1).addReg(Tmp2);
1243 case 1: // Low immediate
1245 case ISD::AND: Opc = PPC::ANDIo; break;
1246 case ISD::OR: Opc = PPC::ORI; break;
1248 BuildMI(BB, Opc, 2, Result).addReg(Tmp1).addImm(Tmp2);
1250 case 2: // Shifted immediate
1252 case ISD::AND: Opc = PPC::ANDISo; break;
1253 case ISD::OR: Opc = PPC::ORIS; break;
1255 BuildMI(BB, Opc, 2, Result).addReg(Tmp1).addImm(Tmp2);
1261 // Check for EQV: xor, (xor a, -1), b
1262 if (N.getOperand(0).getOpcode() == ISD::XOR &&
1263 N.getOperand(0).getOperand(1).getOpcode() == ISD::Constant &&
1264 cast<ConstantSDNode>(N.getOperand(0).getOperand(1))->isAllOnesValue()) {
1266 Tmp1 = SelectExpr(N.getOperand(0).getOperand(0));
1267 Tmp2 = SelectExpr(N.getOperand(1));
1268 BuildMI(BB, PPC::EQV, 2, Result).addReg(Tmp1).addReg(Tmp2);
1271 // Check for NOT, NOR, and NAND: xor (copy, or, and), -1
1272 if (N.getOperand(1).getOpcode() == ISD::Constant &&
1273 cast<ConstantSDNode>(N.getOperand(1))->isAllOnesValue()) {
1275 switch(N.getOperand(0).getOpcode()) {
1277 Tmp1 = SelectExpr(N.getOperand(0).getOperand(0));
1278 Tmp2 = SelectExpr(N.getOperand(0).getOperand(1));
1279 BuildMI(BB, PPC::NOR, 2, Result).addReg(Tmp1).addReg(Tmp2);
1282 Tmp1 = SelectExpr(N.getOperand(0).getOperand(0));
1283 Tmp2 = SelectExpr(N.getOperand(0).getOperand(1));
1284 BuildMI(BB, PPC::NAND, 2, Result).addReg(Tmp1).addReg(Tmp2);
1287 Tmp1 = SelectExpr(N.getOperand(0));
1288 BuildMI(BB, PPC::NOR, 2, Result).addReg(Tmp1).addReg(Tmp1);
1293 Tmp1 = SelectExpr(N.getOperand(0));
1294 switch(getImmediateForOpcode(N.getOperand(1), opcode, Tmp2)) {
1295 default: assert(0 && "unhandled result code");
1296 case 0: // No immediate
1297 Tmp2 = SelectExpr(N.getOperand(1));
1298 BuildMI(BB, PPC::XOR, 2, Result).addReg(Tmp1).addReg(Tmp2);
1300 case 1: // Low immediate
1301 BuildMI(BB, PPC::XORI, 2, Result).addReg(Tmp1).addImm(Tmp2);
1303 case 2: // Shifted immediate
1304 BuildMI(BB, PPC::XORIS, 2, Result).addReg(Tmp1).addImm(Tmp2);
1311 Tmp2 = SelectExpr(N.getOperand(1));
1312 if (1 == getImmediateForOpcode(N.getOperand(0), opcode, Tmp1))
1313 BuildMI(BB, PPC::SUBFIC, 2, Result).addReg(Tmp2).addSImm(Tmp1);
1315 Tmp1 = SelectExpr(N.getOperand(0));
1316 BuildMI(BB, PPC::SUBF, 2, Result).addReg(Tmp2).addReg(Tmp1);
1321 Tmp1 = SelectExpr(N.getOperand(0));
1322 if (1 == getImmediateForOpcode(N.getOperand(1), opcode, Tmp2))
1323 BuildMI(BB, PPC::MULLI, 2, Result).addReg(Tmp1).addSImm(Tmp2);
1325 Tmp2 = SelectExpr(N.getOperand(1));
1326 BuildMI(BB, PPC::MULLD, 2, Result).addReg(Tmp1).addReg(Tmp2);
1332 if (3 == getImmediateForOpcode(N.getOperand(1), opcode, Tmp3)) {
1333 Tmp1 = MakeReg(MVT::i64);
1334 Tmp2 = SelectExpr(N.getOperand(0));
1335 BuildMI(BB, PPC::SRADI, 2, Tmp1).addReg(Tmp2).addImm(Tmp3);
1336 BuildMI(BB, PPC::ADDZE, 1, Result).addReg(Tmp1);
1339 Tmp1 = SelectExpr(N.getOperand(0));
1340 Tmp2 = SelectExpr(N.getOperand(1));
1341 Opc = (ISD::UDIV == opcode) ? PPC::DIVWU : PPC::DIVW;
1342 BuildMI(BB, Opc, 2, Result).addReg(Tmp1).addReg(Tmp2);
1345 case ISD::FP_TO_UINT:
1346 case ISD::FP_TO_SINT: {
1347 Tmp1 = SelectExpr(N.getOperand(0));
1348 Tmp2 = MakeReg(MVT::f64);
1349 BuildMI(BB, PPC::FCTIDZ, 1, Tmp2).addReg(Tmp1);
1350 int FrameIdx = BB->getParent()->getFrameInfo()->CreateStackObject(8, 8);
1351 addFrameReference(BuildMI(BB, PPC::STFD, 3).addReg(Tmp2), FrameIdx);
1352 addFrameReference(BuildMI(BB, PPC::LD, 2, Result), FrameIdx);
1357 if (SetCCSDNode *SetCC = dyn_cast<SetCCSDNode>(Node)) {
1358 Opc = SelectSetCR0(N);
1360 unsigned TrueValue = MakeReg(MVT::i32);
1361 BuildMI(BB, PPC::LI, 1, TrueValue).addSImm(1);
1362 unsigned FalseValue = MakeReg(MVT::i32);
1363 BuildMI(BB, PPC::LI, 1, FalseValue).addSImm(0);
1365 // Create an iterator with which to insert the MBB for copying the false
1366 // value and the MBB to hold the PHI instruction for this SetCC.
1367 MachineBasicBlock *thisMBB = BB;
1368 const BasicBlock *LLVM_BB = BB->getBasicBlock();
1369 ilist<MachineBasicBlock>::iterator It = BB;
1374 // cmpTY cr0, r1, r2
1375 // %TrueValue = li 1
1377 MachineBasicBlock *copy0MBB = new MachineBasicBlock(LLVM_BB);
1378 MachineBasicBlock *sinkMBB = new MachineBasicBlock(LLVM_BB);
1379 BuildMI(BB, Opc, 2).addReg(PPC::CR0).addMBB(sinkMBB);
1380 MachineFunction *F = BB->getParent();
1381 F->getBasicBlockList().insert(It, copy0MBB);
1382 F->getBasicBlockList().insert(It, sinkMBB);
1383 // Update machine-CFG edges
1384 BB->addSuccessor(copy0MBB);
1385 BB->addSuccessor(sinkMBB);
1388 // %FalseValue = li 0
1391 // Update machine-CFG edges
1392 BB->addSuccessor(sinkMBB);
1395 // %Result = phi [ %FalseValue, copy0MBB ], [ %TrueValue, thisMBB ]
1398 BuildMI(BB, PPC::PHI, 4, Result).addReg(FalseValue)
1399 .addMBB(copy0MBB).addReg(TrueValue).addMBB(thisMBB);
1402 assert(0 && "Is this legal?");
1406 unsigned TrueValue = SelectExpr(N.getOperand(1)); //Use if TRUE
1407 unsigned FalseValue = SelectExpr(N.getOperand(2)); //Use if FALSE
1408 Opc = SelectSetCR0(N.getOperand(0));
1410 // Create an iterator with which to insert the MBB for copying the false
1411 // value and the MBB to hold the PHI instruction for this SetCC.
1412 MachineBasicBlock *thisMBB = BB;
1413 const BasicBlock *LLVM_BB = BB->getBasicBlock();
1414 ilist<MachineBasicBlock>::iterator It = BB;
1420 // cmpTY cr0, r1, r2
1422 // fallthrough --> copy0MBB
1423 MachineBasicBlock *copy0MBB = new MachineBasicBlock(LLVM_BB);
1424 MachineBasicBlock *sinkMBB = new MachineBasicBlock(LLVM_BB);
1425 BuildMI(BB, Opc, 2).addReg(PPC::CR0).addMBB(sinkMBB);
1426 MachineFunction *F = BB->getParent();
1427 F->getBasicBlockList().insert(It, copy0MBB);
1428 F->getBasicBlockList().insert(It, sinkMBB);
1429 // Update machine-CFG edges
1430 BB->addSuccessor(copy0MBB);
1431 BB->addSuccessor(sinkMBB);
1434 // %FalseValue = ...
1435 // # fallthrough to sinkMBB
1437 // Update machine-CFG edges
1438 BB->addSuccessor(sinkMBB);
1441 // %Result = phi [ %FalseValue, copy0MBB ], [ %TrueValue, thisMBB ]
1444 BuildMI(BB, PPC::PHI, 4, Result).addReg(FalseValue)
1445 .addMBB(copy0MBB).addReg(TrueValue).addMBB(thisMBB);
1447 // FIXME: Select i64?
1452 switch (N.getValueType()) {
1453 default: assert(0 && "Cannot use constants of this type!");
1455 BuildMI(BB, PPC::LI, 1, Result)
1456 .addSImm(!cast<ConstantSDNode>(N)->isNullValue());
1460 int v = (int)cast<ConstantSDNode>(N)->getSignExtended();
1461 if (v < 32768 && v >= -32768) {
1462 BuildMI(BB, PPC::LI, 1, Result).addSImm(v);
1464 Tmp1 = MakeReg(MVT::i32);
1465 BuildMI(BB, PPC::LIS, 1, Tmp1).addSImm(v >> 16);
1466 BuildMI(BB, PPC::ORI, 2, Result).addReg(Tmp1).addImm(v & 0xFFFF);
1476 void ISel::Select(SDOperand N) {
1477 unsigned Tmp1, Tmp2, Opc;
1478 unsigned opcode = N.getOpcode();
1480 if (!ExprMap.insert(std::make_pair(N, 1)).second)
1481 return; // Already selected.
1483 SDNode *Node = N.Val;
1485 switch (Node->getOpcode()) {
1487 Node->dump(); std::cerr << "\n";
1488 assert(0 && "Node not handled yet!");
1489 case ISD::EntryToken: return; // Noop
1490 case ISD::TokenFactor:
1491 for (unsigned i = 0, e = Node->getNumOperands(); i != e; ++i)
1492 Select(Node->getOperand(i));
1494 case ISD::ADJCALLSTACKDOWN:
1495 case ISD::ADJCALLSTACKUP:
1496 Select(N.getOperand(0));
1497 Tmp1 = cast<ConstantSDNode>(N.getOperand(1))->getValue();
1498 Opc = N.getOpcode() == ISD::ADJCALLSTACKDOWN ? PPC::ADJCALLSTACKDOWN :
1499 PPC::ADJCALLSTACKUP;
1500 BuildMI(BB, Opc, 1).addImm(Tmp1);
1503 MachineBasicBlock *Dest =
1504 cast<BasicBlockSDNode>(N.getOperand(1))->getBasicBlock();
1505 Select(N.getOperand(0));
1506 BuildMI(BB, PPC::B, 1).addMBB(Dest);
1512 case ISD::CopyToReg:
1513 Select(N.getOperand(0));
1514 Tmp1 = SelectExpr(N.getOperand(1));
1515 Tmp2 = cast<RegSDNode>(N)->getReg();
1518 if (N.getOperand(1).getValueType() == MVT::f64 ||
1519 N.getOperand(1).getValueType() == MVT::f32)
1520 BuildMI(BB, PPC::FMR, 1, Tmp2).addReg(Tmp1);
1522 BuildMI(BB, PPC::OR, 2, Tmp2).addReg(Tmp1).addReg(Tmp1);
1525 case ISD::ImplicitDef:
1526 Select(N.getOperand(0));
1527 BuildMI(BB, PPC::IMPLICIT_DEF, 0, cast<RegSDNode>(N)->getReg());
1530 switch (N.getNumOperands()) {
1532 assert(0 && "Unknown return instruction!");
1534 assert(N.getOperand(1).getValueType() == MVT::i32 &&
1535 N.getOperand(2).getValueType() == MVT::i32 &&
1536 "Unknown two-register value!");
1537 Select(N.getOperand(0));
1538 Tmp1 = SelectExpr(N.getOperand(1));
1539 Tmp2 = SelectExpr(N.getOperand(2));
1540 BuildMI(BB, PPC::OR, 2, PPC::R3).addReg(Tmp2).addReg(Tmp2);
1541 BuildMI(BB, PPC::OR, 2, PPC::R4).addReg(Tmp1).addReg(Tmp1);
1544 Select(N.getOperand(0));
1545 Tmp1 = SelectExpr(N.getOperand(1));
1546 switch (N.getOperand(1).getValueType()) {
1548 assert(0 && "Unknown return type!");
1551 BuildMI(BB, PPC::FMR, 1, PPC::F1).addReg(Tmp1);
1554 BuildMI(BB, PPC::OR, 2, PPC::R3).addReg(Tmp1).addReg(Tmp1);
1558 Select(N.getOperand(0));
1561 BuildMI(BB, PPC::BLR, 0); // Just emit a 'ret' instruction
1563 case ISD::TRUNCSTORE:
1566 SDOperand Chain = N.getOperand(0);
1567 SDOperand Value = N.getOperand(1);
1568 SDOperand Address = N.getOperand(2);
1571 Tmp1 = SelectExpr(Value); //value
1573 if (opcode == ISD::STORE) {
1574 switch(Value.getValueType()) {
1575 default: assert(0 && "unknown Type in store");
1576 case MVT::i64: Opc = PPC::STD; break;
1577 case MVT::f64: Opc = PPC::STFD; break;
1578 case MVT::f32: Opc = PPC::STFS; break;
1580 } else { //ISD::TRUNCSTORE
1581 switch(cast<MVTSDNode>(Node)->getExtraValueType()) {
1582 default: assert(0 && "unknown Type in store");
1583 case MVT::i1: //FIXME: DAG does not promote this load
1584 case MVT::i8: Opc= PPC::STB; break;
1585 case MVT::i16: Opc = PPC::STH; break;
1586 case MVT::i32: Opc = PPC::STW; break;
1590 if(Address.getOpcode() == ISD::FrameIndex)
1592 Tmp2 = cast<FrameIndexSDNode>(Address)->getIndex();
1593 addFrameReference(BuildMI(BB, Opc, 3).addReg(Tmp1), (int)Tmp2);
1598 bool idx = SelectAddr(Address, Tmp2, offset);
1600 Opc = IndexedOpForOp(Opc);
1601 BuildMI(BB, Opc, 3).addReg(Tmp1).addReg(Tmp2).addReg(offset);
1603 BuildMI(BB, Opc, 3).addReg(Tmp1).addImm(offset).addReg(Tmp2);
1612 case ISD::CopyFromReg:
1614 case ISD::DYNAMIC_STACKALLOC:
1619 assert(0 && "Should not be reached!");
1623 /// createPPC32PatternInstructionSelector - This pass converts an LLVM function
1624 /// into a machine code representation using pattern matching and a machine
1625 /// description file.
1627 FunctionPass *llvm::createPPC64ISelPattern(TargetMachine &TM) {
1628 return new ISel(TM);