lib/CodeGen/SelectionDAG/LegalizeDAG.cpp

   1 //===-- LegalizeDAG.cpp - Implement SelectionDAG::Legalize ----------------===//
   2 //
   3 //                     The LLVM Compiler Infrastructure
   4 //
   5 // This file is distributed under the University of Illinois Open Source
   6 // License. See LICENSE.TXT for details.
   7 //
   8 //===----------------------------------------------------------------------===//
   9 //
  10 // This file implements the SelectionDAG::Legalize method.
  11 //
  12 //===----------------------------------------------------------------------===//
  13
  14 #include "llvm/Analysis/DebugInfo.h"
  15 #include "llvm/CodeGen/Analysis.h"
  16 #include "llvm/CodeGen/MachineFunction.h"
  17 #include "llvm/CodeGen/MachineJumpTableInfo.h"
  18 #include "llvm/CodeGen/SelectionDAG.h"
  19 #include "llvm/Target/TargetFrameLowering.h"
  20 #include "llvm/Target/TargetLowering.h"
  21 #include "llvm/Target/TargetData.h"
  22 #include "llvm/Target/TargetMachine.h"
  23 #include "llvm/CallingConv.h"
  24 #include "llvm/Constants.h"
  25 #include "llvm/DerivedTypes.h"
  26 #include "llvm/LLVMContext.h"
  27 #include "llvm/Support/Debug.h"
  28 #include "llvm/Support/ErrorHandling.h"
  29 #include "llvm/Support/MathExtras.h"
  30 #include "llvm/Support/raw_ostream.h"
  31 #include "llvm/ADT/DenseMap.h"
  32 #include "llvm/ADT/SmallVector.h"
  33 #include "llvm/ADT/SmallPtrSet.h"
  34 using namespace llvm;
  35
  36 //===----------------------------------------------------------------------===//
  37 /// SelectionDAGLegalize - This takes an arbitrary SelectionDAG as input and
  38 /// hacks on it until the target machine can handle it.  This involves
  39 /// eliminating value sizes the machine cannot handle (promoting small sizes to
  40 /// large sizes or splitting up large values into small values) as well as
  41 /// eliminating operations the machine cannot handle.
  42 ///
  43 /// This code also does a small amount of optimization and recognition of idioms
  44 /// as part of its processing.  For example, if a target does not support a
  45 /// 'setcc' instruction efficiently, but does support 'brcc' instruction, this
  46 /// will attempt merge setcc and brc instructions into brcc's.
  47 ///
  48 namespace {
  49 class SelectionDAGLegalize {
  50   const TargetMachine &TM;
  51   const TargetLowering &TLI;
  52   SelectionDAG &DAG;
  53
  54   // Libcall insertion helpers.
  55
  56   /// LastCALLSEQ - This keeps track of the CALLSEQ_END node that has been
  57   /// legalized.  We use this to ensure that calls are properly serialized
  58   /// against each other, including inserted libcalls.
  59   SmallVector<SDValue, 8> LastCALLSEQ;
  60
  61   enum LegalizeAction {
  62     Legal,      // The target natively supports this operation.
  63     Promote,    // This operation should be executed in a larger type.
  64     Expand      // Try to expand this to other ops, otherwise use a libcall.
  65   };
  66
  67   /// LegalizedNodes - For nodes that are of legal width, and that have more
  68   /// than one use, this map indicates what regularized operand to use.  This
  69   /// allows us to avoid legalizing the same thing more than once.
  70   DenseMap<SDValue, SDValue> LegalizedNodes;
  71
  72   void AddLegalizedOperand(SDValue From, SDValue To) {
  73     LegalizedNodes.insert(std::make_pair(From, To));
  74     // If someone requests legalization of the new node, return itself.
  75     if (From != To)
  76       LegalizedNodes.insert(std::make_pair(To, To));
  77
  78     // Transfer SDDbgValues.
  79     DAG.TransferDbgValues(From, To);
  80   }
  81
  82 public:
  83   explicit SelectionDAGLegalize(SelectionDAG &DAG);
  84
  85   void LegalizeDAG();
  86
  87 private:
  88   /// LegalizeOp - Return a legal replacement for the given operation, with
  89   /// all legal operands.
  90   SDValue LegalizeOp(SDValue O);
  91
  92   SDValue OptimizeFloatStore(StoreSDNode *ST);
  93
  94   /// PerformInsertVectorEltInMemory - Some target cannot handle a variable
  95   /// insertion index for the INSERT_VECTOR_ELT instruction.  In this case, it
  96   /// is necessary to spill the vector being inserted into to memory, perform
  97   /// the insert there, and then read the result back.
  98   SDValue PerformInsertVectorEltInMemory(SDValue Vec, SDValue Val,
  99                                          SDValue Idx, DebugLoc dl);
 100   SDValue ExpandINSERT_VECTOR_ELT(SDValue Vec, SDValue Val,
 101                                   SDValue Idx, DebugLoc dl);
 102
 103   /// ShuffleWithNarrowerEltType - Return a vector shuffle operation which
 104   /// performs the same shuffe in terms of order or result bytes, but on a type
 105   /// whose vector element type is narrower than the original shuffle type.
 106   /// e.g. <v4i32> <0, 1, 0, 1> -> v8i16 <0, 1, 2, 3, 0, 1, 2, 3>
 107   SDValue ShuffleWithNarrowerEltType(EVT NVT, EVT VT, DebugLoc dl,
 108                                      SDValue N1, SDValue N2,
 109                                      SmallVectorImpl<int> &Mask) const;
 110
 111   bool LegalizeAllNodesNotLeadingTo(SDNode *N, SDNode *Dest,
 112                                     SmallPtrSet<SDNode*, 32> &NodesLeadingTo);
 113
 114   void LegalizeSetCCCondCode(EVT VT, SDValue &LHS, SDValue &RHS, SDValue &CC,
 115                              DebugLoc dl);
 116
 117   SDValue ExpandLibCall(RTLIB::Libcall LC, SDNode *Node, bool isSigned);
 118   SDValue ExpandLibCall(RTLIB::Libcall LC, EVT RetVT, const SDValue *Ops,
 119                         unsigned NumOps, bool isSigned, DebugLoc dl);
 120
 121   std::pair<SDValue, SDValue> ExpandChainLibCall(RTLIB::Libcall LC,
 122                                                  SDNode *Node, bool isSigned);
 123   SDValue ExpandFPLibCall(SDNode *Node, RTLIB::Libcall Call_F32,
 124                           RTLIB::Libcall Call_F64, RTLIB::Libcall Call_F80,
 125                           RTLIB::Libcall Call_PPCF128);
 126   SDValue ExpandIntLibCall(SDNode *Node, bool isSigned,
 127                            RTLIB::Libcall Call_I8,
 128                            RTLIB::Libcall Call_I16,
 129                            RTLIB::Libcall Call_I32,
 130                            RTLIB::Libcall Call_I64,
 131                            RTLIB::Libcall Call_I128);
 132   void ExpandDivRemLibCall(SDNode *Node, SmallVectorImpl<SDValue> &Results);
 133
 134   SDValue EmitStackConvert(SDValue SrcOp, EVT SlotVT, EVT DestVT, DebugLoc dl);
 135   SDValue ExpandBUILD_VECTOR(SDNode *Node);
 136   SDValue ExpandSCALAR_TO_VECTOR(SDNode *Node);
 137   void ExpandDYNAMIC_STACKALLOC(SDNode *Node,
 138                                 SmallVectorImpl<SDValue> &Results);
 139   SDValue ExpandFCOPYSIGN(SDNode *Node);
 140   SDValue ExpandLegalINT_TO_FP(bool isSigned, SDValue LegalOp, EVT DestVT,
 141                                DebugLoc dl);
 142   SDValue PromoteLegalINT_TO_FP(SDValue LegalOp, EVT DestVT, bool isSigned,
 143                                 DebugLoc dl);
 144   SDValue PromoteLegalFP_TO_INT(SDValue LegalOp, EVT DestVT, bool isSigned,
 145                                 DebugLoc dl);
 146
 147   SDValue ExpandBSWAP(SDValue Op, DebugLoc dl);
 148   SDValue ExpandBitCount(unsigned Opc, SDValue Op, DebugLoc dl);
 149
 150   SDValue ExpandExtractFromVectorThroughStack(SDValue Op);
 151   SDValue ExpandInsertToVectorThroughStack(SDValue Op);
 152   SDValue ExpandVectorBuildThroughStack(SDNode* Node);
 153
 154   std::pair<SDValue, SDValue> ExpandAtomic(SDNode *Node);
 155
 156   void ExpandNode(SDNode *Node, SmallVectorImpl<SDValue> &Results);
 157   void PromoteNode(SDNode *Node, SmallVectorImpl<SDValue> &Results);
 158
 159   SDValue getLastCALLSEQ() { return LastCALLSEQ.back();  }
 160   void setLastCALLSEQ(const SDValue s) { LastCALLSEQ.back() = s; }
 161   void pushLastCALLSEQ(SDValue s) {
 162     LastCALLSEQ.push_back(s);
 163   }
 164   void popLastCALLSEQ() {
 165     LastCALLSEQ.pop_back();
 166   }
 167 };
 168 }
 169
 170 /// ShuffleWithNarrowerEltType - Return a vector shuffle operation which
 171 /// performs the same shuffe in terms of order or result bytes, but on a type
 172 /// whose vector element type is narrower than the original shuffle type.
 173 /// e.g. <v4i32> <0, 1, 0, 1> -> v8i16 <0, 1, 2, 3, 0, 1, 2, 3>
 174 SDValue
 175 SelectionDAGLegalize::ShuffleWithNarrowerEltType(EVT NVT, EVT VT,  DebugLoc dl,
 176                                                  SDValue N1, SDValue N2,
 177                                              SmallVectorImpl<int> &Mask) const {
 178   unsigned NumMaskElts = VT.getVectorNumElements();
 179   unsigned NumDestElts = NVT.getVectorNumElements();
 180   unsigned NumEltsGrowth = NumDestElts / NumMaskElts;
 181
 182   assert(NumEltsGrowth && "Cannot promote to vector type with fewer elts!");
 183
 184   if (NumEltsGrowth == 1)
 185     return DAG.getVectorShuffle(NVT, dl, N1, N2, &Mask[0]);
 186
 187   SmallVector<int, 8> NewMask;
 188   for (unsigned i = 0; i != NumMaskElts; ++i) {
 189     int Idx = Mask[i];
 190     for (unsigned j = 0; j != NumEltsGrowth; ++j) {
 191       if (Idx < 0)
 192         NewMask.push_back(-1);
 193       else
 194         NewMask.push_back(Idx * NumEltsGrowth + j);
 195     }
 196   }
 197   assert(NewMask.size() == NumDestElts && "Non-integer NumEltsGrowth?");
 198   assert(TLI.isShuffleMaskLegal(NewMask, NVT) && "Shuffle not legal?");
 199   return DAG.getVectorShuffle(NVT, dl, N1, N2, &NewMask[0]);
 200 }
 201
 202 SelectionDAGLegalize::SelectionDAGLegalize(SelectionDAG &dag)
 203   : TM(dag.getTarget()), TLI(dag.getTargetLoweringInfo()),
 204     DAG(dag) {
 205 }
 206
 207 void SelectionDAGLegalize::LegalizeDAG() {
 208   pushLastCALLSEQ(DAG.getEntryNode());
 209
 210   // The legalize process is inherently a bottom-up recursive process (users
 211   // legalize their uses before themselves).  Given infinite stack space, we
 212   // could just start legalizing on the root and traverse the whole graph.  In
 213   // practice however, this causes us to run out of stack space on large basic
 214   // blocks.  To avoid this problem, compute an ordering of the nodes where each
 215   // node is only legalized after all of its operands are legalized.
 216   DAG.AssignTopologicalOrder();
 217   for (SelectionDAG::allnodes_iterator I = DAG.allnodes_begin(),
 218        E = prior(DAG.allnodes_end()); I != llvm::next(E); ++I)
 219     LegalizeOp(SDValue(I, 0));
 220
 221   // Finally, it's possible the root changed.  Get the new root.
 222   SDValue OldRoot = DAG.getRoot();
 223   assert(LegalizedNodes.count(OldRoot) && "Root didn't get legalized?");
 224   DAG.setRoot(LegalizedNodes[OldRoot]);
 225
 226   LegalizedNodes.clear();
 227
 228   // Remove dead nodes now.
 229   DAG.RemoveDeadNodes();
 230 }
 231
 232
 233 /// FindCallEndFromCallStart - Given a chained node that is part of a call
 234 /// sequence, find the CALLSEQ_END node that terminates the call sequence.
 235 static SDNode *FindCallEndFromCallStart(SDNode *Node, int depth = 0) {
 236   int next_depth = depth;
 237   if (Node->getOpcode() == ISD::CALLSEQ_START)
 238     next_depth = depth + 1;
 239   if (Node->getOpcode() == ISD::CALLSEQ_END) {
 240     assert(depth > 0 && "negative depth!");
 241     if (depth == 1)
 242       return Node;
 243     else
 244       next_depth = depth - 1;
 245   }
 246   if (Node->use_empty())
 247     return 0;   // No CallSeqEnd
 248
 249   // The chain is usually at the end.
 250   SDValue TheChain(Node, Node->getNumValues()-1);
 251   if (TheChain.getValueType() != MVT::Other) {
 252     // Sometimes it's at the beginning.
 253     TheChain = SDValue(Node, 0);
 254     if (TheChain.getValueType() != MVT::Other) {
 255       // Otherwise, hunt for it.
 256       for (unsigned i = 1, e = Node->getNumValues(); i != e; ++i)
 257         if (Node->getValueType(i) == MVT::Other) {
 258           TheChain = SDValue(Node, i);
 259           break;
 260         }
 261
 262       // Otherwise, we walked into a node without a chain.
 263       if (TheChain.getValueType() != MVT::Other)
 264         return 0;
 265     }
 266   }
 267
 268   for (SDNode::use_iterator UI = Node->use_begin(),
 269        E = Node->use_end(); UI != E; ++UI) {
 270
 271     // Make sure to only follow users of our token chain.
 272     SDNode *User = *UI;
 273     for (unsigned i = 0, e = User->getNumOperands(); i != e; ++i)
 274       if (User->getOperand(i) == TheChain)
 275         if (SDNode *Result = FindCallEndFromCallStart(User, next_depth))
 276           return Result;
 277   }
 278   return 0;
 279 }
 280
 281 /// FindCallStartFromCallEnd - Given a chained node that is part of a call
 282 /// sequence, find the CALLSEQ_START node that initiates the call sequence.
 283 static SDNode *FindCallStartFromCallEnd(SDNode *Node) {
 284   int nested = 0;
 285   assert(Node && "Didn't find callseq_start for a call??");
 286   while (Node->getOpcode() != ISD::CALLSEQ_START || nested) {
 287     Node = Node->getOperand(0).getNode();
 288     assert(Node->getOperand(0).getValueType() == MVT::Other &&
 289            "Node doesn't have a token chain argument!");
 290     switch (Node->getOpcode()) {
 291     default:
 292       break;
 293     case ISD::CALLSEQ_START:
 294       if (!nested)
 295         return Node;
 296       Node = Node->getOperand(0).getNode();
 297       nested--;
 298       break;
 299     case ISD::CALLSEQ_END:
 300       nested++;
 301       break;
 302     }
 303   }
 304   return (Node->getOpcode() == ISD::CALLSEQ_START) ? Node : 0;
 305 }
 306
 307 /// LegalizeAllNodesNotLeadingTo - Recursively walk the uses of N, looking to
 308 /// see if any uses can reach Dest.  If no dest operands can get to dest,
 309 /// legalize them, legalize ourself, and return false, otherwise, return true.
 310 ///
 311 /// Keep track of the nodes we fine that actually do lead to Dest in
 312 /// NodesLeadingTo.  This avoids retraversing them exponential number of times.
 313 ///
 314 bool SelectionDAGLegalize::LegalizeAllNodesNotLeadingTo(SDNode *N, SDNode *Dest,
 315                                      SmallPtrSet<SDNode*, 32> &NodesLeadingTo) {
 316   if (N == Dest) return true;  // N certainly leads to Dest :)
 317
 318   // If we've already processed this node and it does lead to Dest, there is no
 319   // need to reprocess it.
 320   if (NodesLeadingTo.count(N)) return true;
 321
 322   // If the first result of this node has been already legalized, then it cannot
 323   // reach N.
 324   if (LegalizedNodes.count(SDValue(N, 0))) return false;
 325
 326   // Okay, this node has not already been legalized.  Check and legalize all
 327   // operands.  If none lead to Dest, then we can legalize this node.
 328   bool OperandsLeadToDest = false;
 329   for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i)
 330     OperandsLeadToDest |=     // If an operand leads to Dest, so do we.
 331       LegalizeAllNodesNotLeadingTo(N->getOperand(i).getNode(), Dest,
 332                                    NodesLeadingTo);
 333
 334   if (OperandsLeadToDest) {
 335     NodesLeadingTo.insert(N);
 336     return true;
 337   }
 338
 339   // Okay, this node looks safe, legalize it and return false.
 340   LegalizeOp(SDValue(N, 0));
 341   return false;
 342 }
 343
 344 /// ExpandConstantFP - Expands the ConstantFP node to an integer constant or
 345 /// a load from the constant pool.
 346 static SDValue ExpandConstantFP(ConstantFPSDNode *CFP, bool UseCP,
 347                                 SelectionDAG &DAG, const TargetLowering &TLI) {
 348   bool Extend = false;
 349   DebugLoc dl = CFP->getDebugLoc();
 350
 351   // If a FP immediate is precise when represented as a float and if the
 352   // target can do an extending load from float to double, we put it into
 353   // the constant pool as a float, even if it's is statically typed as a
 354   // double.  This shrinks FP constants and canonicalizes them for targets where
 355   // an FP extending load is the same cost as a normal load (such as on the x87
 356   // fp stack or PPC FP unit).
 357   EVT VT = CFP->getValueType(0);
 358   ConstantFP *LLVMC = const_cast<ConstantFP*>(CFP->getConstantFPValue());
 359   if (!UseCP) {
 360     assert((VT == MVT::f64 || VT == MVT::f32) && "Invalid type expansion");
 361     return DAG.getConstant(LLVMC->getValueAPF().bitcastToAPInt(),
 362                            (VT == MVT::f64) ? MVT::i64 : MVT::i32);
 363   }
 364
 365   EVT OrigVT = VT;
 366   EVT SVT = VT;
 367   while (SVT != MVT::f32) {
 368     SVT = (MVT::SimpleValueType)(SVT.getSimpleVT().SimpleTy - 1);
 369     if (ConstantFPSDNode::isValueValidForType(SVT, CFP->getValueAPF()) &&
 370         // Only do this if the target has a native EXTLOAD instruction from
 371         // smaller type.
 372         TLI.isLoadExtLegal(ISD::EXTLOAD, SVT) &&
 373         TLI.ShouldShrinkFPConstant(OrigVT)) {
 374       const Type *SType = SVT.getTypeForEVT(*DAG.getContext());
 375       LLVMC = cast<ConstantFP>(ConstantExpr::getFPTrunc(LLVMC, SType));
 376       VT = SVT;
 377       Extend = true;
 378     }
 379   }
 380
 381   SDValue CPIdx = DAG.getConstantPool(LLVMC, TLI.getPointerTy());
 382   unsigned Alignment = cast<ConstantPoolSDNode>(CPIdx)->getAlignment();
 383   if (Extend)
 384     return DAG.getExtLoad(ISD::EXTLOAD, dl, OrigVT,
 385                           DAG.getEntryNode(),
 386                           CPIdx, MachinePointerInfo::getConstantPool(),
 387                           VT, false, false, Alignment);
 388   return DAG.getLoad(OrigVT, dl, DAG.getEntryNode(), CPIdx,
 389                      MachinePointerInfo::getConstantPool(), false, false,
 390                      Alignment);
 391 }
 392
 393 /// ExpandUnalignedStore - Expands an unaligned store to 2 half-size stores.
 394 static
 395 SDValue ExpandUnalignedStore(StoreSDNode *ST, SelectionDAG &DAG,
 396                              const TargetLowering &TLI) {
 397   SDValue Chain = ST->getChain();
 398   SDValue Ptr = ST->getBasePtr();
 399   SDValue Val = ST->getValue();
 400   EVT VT = Val.getValueType();
 401   int Alignment = ST->getAlignment();
 402   DebugLoc dl = ST->getDebugLoc();
 403   if (ST->getMemoryVT().isFloatingPoint() ||
 404       ST->getMemoryVT().isVector()) {
 405     EVT intVT = EVT::getIntegerVT(*DAG.getContext(), VT.getSizeInBits());
 406     if (TLI.isTypeLegal(intVT)) {
 407       // Expand to a bitconvert of the value to the integer type of the
 408       // same size, then a (misaligned) int store.
 409       // FIXME: Does not handle truncating floating point stores!
 410       SDValue Result = DAG.getNode(ISD::BITCAST, dl, intVT, Val);
 411       return DAG.getStore(Chain, dl, Result, Ptr, ST->getPointerInfo(),
 412                           ST->isVolatile(), ST->isNonTemporal(), Alignment);
 413     }
 414     // Do a (aligned) store to a stack slot, then copy from the stack slot
 415     // to the final destination using (unaligned) integer loads and stores.
 416     EVT StoredVT = ST->getMemoryVT();
 417     EVT RegVT =
 418       TLI.getRegisterType(*DAG.getContext(),
 419                           EVT::getIntegerVT(*DAG.getContext(),
 420                                             StoredVT.getSizeInBits()));
 421     unsigned StoredBytes = StoredVT.getSizeInBits() / 8;
 422     unsigned RegBytes = RegVT.getSizeInBits() / 8;
 423     unsigned NumRegs = (StoredBytes + RegBytes - 1) / RegBytes;
 424
 425     // Make sure the stack slot is also aligned for the register type.
 426     SDValue StackPtr = DAG.CreateStackTemporary(StoredVT, RegVT);
 427
 428     // Perform the original store, only redirected to the stack slot.
 429     SDValue Store = DAG.getTruncStore(Chain, dl,
 430                                       Val, StackPtr, MachinePointerInfo(),
 431                                       StoredVT, false, false, 0);
 432     SDValue Increment = DAG.getConstant(RegBytes, TLI.getPointerTy());
 433     SmallVector<SDValue, 8> Stores;
 434     unsigned Offset = 0;
 435
 436     // Do all but one copies using the full register width.
 437     for (unsigned i = 1; i < NumRegs; i++) {
 438       // Load one integer register's worth from the stack slot.
 439       SDValue Load = DAG.getLoad(RegVT, dl, Store, StackPtr,
 440                                  MachinePointerInfo(),
 441                                  false, false, 0);
 442       // Store it to the final location.  Remember the store.
 443       Stores.push_back(DAG.getStore(Load.getValue(1), dl, Load, Ptr,
 444                                   ST->getPointerInfo().getWithOffset(Offset),
 445                                     ST->isVolatile(), ST->isNonTemporal(),
 446                                     MinAlign(ST->getAlignment(), Offset)));
 447       // Increment the pointers.
 448       Offset += RegBytes;
 449       StackPtr = DAG.getNode(ISD::ADD, dl, StackPtr.getValueType(), StackPtr,
 450                              Increment);
 451       Ptr = DAG.getNode(ISD::ADD, dl, Ptr.getValueType(), Ptr, Increment);
 452     }
 453
 454     // The last store may be partial.  Do a truncating store.  On big-endian
 455     // machines this requires an extending load from the stack slot to ensure
 456     // that the bits are in the right place.
 457     EVT MemVT = EVT::getIntegerVT(*DAG.getContext(),
 458                                   8 * (StoredBytes - Offset));
 459
 460     // Load from the stack slot.
 461     SDValue Load = DAG.getExtLoad(ISD::EXTLOAD, dl, RegVT, Store, StackPtr,
 462                                   MachinePointerInfo(),
 463                                   MemVT, false, false, 0);
 464
 465     Stores.push_back(DAG.getTruncStore(Load.getValue(1), dl, Load, Ptr,
 466                                        ST->getPointerInfo()
 467                                          .getWithOffset(Offset),
 468                                        MemVT, ST->isVolatile(),
 469                                        ST->isNonTemporal(),
 470                                        MinAlign(ST->getAlignment(), Offset)));
 471     // The order of the stores doesn't matter - say it with a TokenFactor.
 472     return DAG.getNode(ISD::TokenFactor, dl, MVT::Other, &Stores[0],
 473                        Stores.size());
 474   }
 475   assert(ST->getMemoryVT().isInteger() &&
 476          !ST->getMemoryVT().isVector() &&
 477          "Unaligned store of unknown type.");
 478   // Get the half-size VT
 479   EVT NewStoredVT = ST->getMemoryVT().getHalfSizedIntegerVT(*DAG.getContext());
 480   int NumBits = NewStoredVT.getSizeInBits();
 481   int IncrementSize = NumBits / 8;
 482
 483   // Divide the stored value in two parts.
 484   SDValue ShiftAmount = DAG.getConstant(NumBits,
 485                                       TLI.getShiftAmountTy(Val.getValueType()));
 486   SDValue Lo = Val;
 487   SDValue Hi = DAG.getNode(ISD::SRL, dl, VT, Val, ShiftAmount);
 488
 489   // Store the two parts
 490   SDValue Store1, Store2;
 491   Store1 = DAG.getTruncStore(Chain, dl, TLI.isLittleEndian()?Lo:Hi, Ptr,
 492                              ST->getPointerInfo(), NewStoredVT,
 493                              ST->isVolatile(), ST->isNonTemporal(), Alignment);
 494   Ptr = DAG.getNode(ISD::ADD, dl, Ptr.getValueType(), Ptr,
 495                     DAG.getConstant(IncrementSize, TLI.getPointerTy()));
 496   Alignment = MinAlign(Alignment, IncrementSize);
 497   Store2 = DAG.getTruncStore(Chain, dl, TLI.isLittleEndian()?Hi:Lo, Ptr,
 498                              ST->getPointerInfo().getWithOffset(IncrementSize),
 499                              NewStoredVT, ST->isVolatile(), ST->isNonTemporal(),
 500                              Alignment);
 501
 502   return DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Store1, Store2);
 503 }
 504
 505 /// ExpandUnalignedLoad - Expands an unaligned load to 2 half-size loads.
 506 static
 507 SDValue ExpandUnalignedLoad(LoadSDNode *LD, SelectionDAG &DAG,
 508                             const TargetLowering &TLI) {
 509   SDValue Chain = LD->getChain();
 510   SDValue Ptr = LD->getBasePtr();
 511   EVT VT = LD->getValueType(0);
 512   EVT LoadedVT = LD->getMemoryVT();
 513   DebugLoc dl = LD->getDebugLoc();
 514   if (VT.isFloatingPoint() || VT.isVector()) {
 515     EVT intVT = EVT::getIntegerVT(*DAG.getContext(), LoadedVT.getSizeInBits());
 516     if (TLI.isTypeLegal(intVT)) {
 517       // Expand to a (misaligned) integer load of the same size,
 518       // then bitconvert to floating point or vector.
 519       SDValue newLoad = DAG.getLoad(intVT, dl, Chain, Ptr, LD->getPointerInfo(),
 520                                     LD->isVolatile(),
 521                                     LD->isNonTemporal(), LD->getAlignment());
 522       SDValue Result = DAG.getNode(ISD::BITCAST, dl, LoadedVT, newLoad);
 523       if (VT.isFloatingPoint() && LoadedVT != VT)
 524         Result = DAG.getNode(ISD::FP_EXTEND, dl, VT, Result);
 525
 526       SDValue Ops[] = { Result, Chain };
 527       return DAG.getMergeValues(Ops, 2, dl);
 528     }
 529
 530     // Copy the value to a (aligned) stack slot using (unaligned) integer
 531     // loads and stores, then do a (aligned) load from the stack slot.
 532     EVT RegVT = TLI.getRegisterType(*DAG.getContext(), intVT);
 533     unsigned LoadedBytes = LoadedVT.getSizeInBits() / 8;
 534     unsigned RegBytes = RegVT.getSizeInBits() / 8;
 535     unsigned NumRegs = (LoadedBytes + RegBytes - 1) / RegBytes;
 536
 537     // Make sure the stack slot is also aligned for the register type.
 538     SDValue StackBase = DAG.CreateStackTemporary(LoadedVT, RegVT);
 539
 540     SDValue Increment = DAG.getConstant(RegBytes, TLI.getPointerTy());
 541     SmallVector<SDValue, 8> Stores;
 542     SDValue StackPtr = StackBase;
 543     unsigned Offset = 0;
 544
 545     // Do all but one copies using the full register width.
 546     for (unsigned i = 1; i < NumRegs; i++) {
 547       // Load one integer register's worth from the original location.
 548       SDValue Load = DAG.getLoad(RegVT, dl, Chain, Ptr,
 549                                  LD->getPointerInfo().getWithOffset(Offset),
 550                                  LD->isVolatile(), LD->isNonTemporal(),
 551                                  MinAlign(LD->getAlignment(), Offset));
 552       // Follow the load with a store to the stack slot.  Remember the store.
 553       Stores.push_back(DAG.getStore(Load.getValue(1), dl, Load, StackPtr,
 554                                     MachinePointerInfo(), false, false, 0));
 555       // Increment the pointers.
 556       Offset += RegBytes;
 557       Ptr = DAG.getNode(ISD::ADD, dl, Ptr.getValueType(), Ptr, Increment);
 558       StackPtr = DAG.getNode(ISD::ADD, dl, StackPtr.getValueType(), StackPtr,
 559                              Increment);
 560     }
 561
 562     // The last copy may be partial.  Do an extending load.
 563     EVT MemVT = EVT::getIntegerVT(*DAG.getContext(),
 564                                   8 * (LoadedBytes - Offset));
 565     SDValue Load = DAG.getExtLoad(ISD::EXTLOAD, dl, RegVT, Chain, Ptr,
 566                                   LD->getPointerInfo().getWithOffset(Offset),
 567                                   MemVT, LD->isVolatile(),
 568                                   LD->isNonTemporal(),
 569                                   MinAlign(LD->getAlignment(), Offset));
 570     // Follow the load with a store to the stack slot.  Remember the store.
 571     // On big-endian machines this requires a truncating store to ensure
 572     // that the bits end up in the right place.
 573     Stores.push_back(DAG.getTruncStore(Load.getValue(1), dl, Load, StackPtr,
 574                                        MachinePointerInfo(), MemVT,
 575                                        false, false, 0));
 576
 577     // The order of the stores doesn't matter - say it with a TokenFactor.
 578     SDValue TF = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, &Stores[0],
 579                              Stores.size());
 580
 581     // Finally, perform the original load only redirected to the stack slot.
 582     Load = DAG.getExtLoad(LD->getExtensionType(), dl, VT, TF, StackBase,
 583                           MachinePointerInfo(), LoadedVT, false, false, 0);
 584
 585     // Callers expect a MERGE_VALUES node.
 586     SDValue Ops[] = { Load, TF };
 587     return DAG.getMergeValues(Ops, 2, dl);
 588   }
 589   assert(LoadedVT.isInteger() && !LoadedVT.isVector() &&
 590          "Unaligned load of unsupported type.");
 591
 592   // Compute the new VT that is half the size of the old one.  This is an
 593   // integer MVT.
 594   unsigned NumBits = LoadedVT.getSizeInBits();
 595   EVT NewLoadedVT;
 596   NewLoadedVT = EVT::getIntegerVT(*DAG.getContext(), NumBits/2);
 597   NumBits >>= 1;
 598
 599   unsigned Alignment = LD->getAlignment();
 600   unsigned IncrementSize = NumBits / 8;
 601   ISD::LoadExtType HiExtType = LD->getExtensionType();
 602
 603   // If the original load is NON_EXTLOAD, the hi part load must be ZEXTLOAD.
 604   if (HiExtType == ISD::NON_EXTLOAD)
 605     HiExtType = ISD::ZEXTLOAD;
 606
 607   // Load the value in two parts
 608   SDValue Lo, Hi;
 609   if (TLI.isLittleEndian()) {
 610     Lo = DAG.getExtLoad(ISD::ZEXTLOAD, dl, VT, Chain, Ptr, LD->getPointerInfo(),
 611                         NewLoadedVT, LD->isVolatile(),
 612                         LD->isNonTemporal(), Alignment);
 613     Ptr = DAG.getNode(ISD::ADD, dl, Ptr.getValueType(), Ptr,
 614                       DAG.getConstant(IncrementSize, TLI.getPointerTy()));
 615     Hi = DAG.getExtLoad(HiExtType, dl, VT, Chain, Ptr,
 616                         LD->getPointerInfo().getWithOffset(IncrementSize),
 617                         NewLoadedVT, LD->isVolatile(),
 618                         LD->isNonTemporal(), MinAlign(Alignment,IncrementSize));
 619   } else {
 620     Hi = DAG.getExtLoad(HiExtType, dl, VT, Chain, Ptr, LD->getPointerInfo(),
 621                         NewLoadedVT, LD->isVolatile(),
 622                         LD->isNonTemporal(), Alignment);
 623     Ptr = DAG.getNode(ISD::ADD, dl, Ptr.getValueType(), Ptr,
 624                       DAG.getConstant(IncrementSize, TLI.getPointerTy()));
 625     Lo = DAG.getExtLoad(ISD::ZEXTLOAD, dl, VT, Chain, Ptr,
 626                         LD->getPointerInfo().getWithOffset(IncrementSize),
 627                         NewLoadedVT, LD->isVolatile(),
 628                         LD->isNonTemporal(), MinAlign(Alignment,IncrementSize));
 629   }
 630
 631   // aggregate the two parts
 632   SDValue ShiftAmount = DAG.getConstant(NumBits,
 633                                        TLI.getShiftAmountTy(Hi.getValueType()));
 634   SDValue Result = DAG.getNode(ISD::SHL, dl, VT, Hi, ShiftAmount);
 635   Result = DAG.getNode(ISD::OR, dl, VT, Result, Lo);
 636
 637   SDValue TF = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo.getValue(1),
 638                              Hi.getValue(1));
 639
 640   SDValue Ops[] = { Result, TF };
 641   return DAG.getMergeValues(Ops, 2, dl);
 642 }
 643
 644 /// PerformInsertVectorEltInMemory - Some target cannot handle a variable
 645 /// insertion index for the INSERT_VECTOR_ELT instruction.  In this case, it
 646 /// is necessary to spill the vector being inserted into to memory, perform
 647 /// the insert there, and then read the result back.
 648 SDValue SelectionDAGLegalize::
 649 PerformInsertVectorEltInMemory(SDValue Vec, SDValue Val, SDValue Idx,
 650                                DebugLoc dl) {
 651   SDValue Tmp1 = Vec;
 652   SDValue Tmp2 = Val;
 653   SDValue Tmp3 = Idx;
 654
 655   // If the target doesn't support this, we have to spill the input vector
 656   // to a temporary stack slot, update the element, then reload it.  This is
 657   // badness.  We could also load the value into a vector register (either
 658   // with a "move to register" or "extload into register" instruction, then
 659   // permute it into place, if the idx is a constant and if the idx is
 660   // supported by the target.
 661   EVT VT    = Tmp1.getValueType();
 662   EVT EltVT = VT.getVectorElementType();
 663   EVT IdxVT = Tmp3.getValueType();
 664   EVT PtrVT = TLI.getPointerTy();
 665   SDValue StackPtr = DAG.CreateStackTemporary(VT);
 666
 667   int SPFI = cast<FrameIndexSDNode>(StackPtr.getNode())->getIndex();
 668
 669   // Store the vector.
 670   SDValue Ch = DAG.getStore(DAG.getEntryNode(), dl, Tmp1, StackPtr,
 671                             MachinePointerInfo::getFixedStack(SPFI),
 672                             false, false, 0);
 673
 674   // Truncate or zero extend offset to target pointer type.
 675   unsigned CastOpc = IdxVT.bitsGT(PtrVT) ? ISD::TRUNCATE : ISD::ZERO_EXTEND;
 676   Tmp3 = DAG.getNode(CastOpc, dl, PtrVT, Tmp3);
 677   // Add the offset to the index.
 678   unsigned EltSize = EltVT.getSizeInBits()/8;
 679   Tmp3 = DAG.getNode(ISD::MUL, dl, IdxVT, Tmp3,DAG.getConstant(EltSize, IdxVT));
 680   SDValue StackPtr2 = DAG.getNode(ISD::ADD, dl, IdxVT, Tmp3, StackPtr);
 681   // Store the scalar value.
 682   Ch = DAG.getTruncStore(Ch, dl, Tmp2, StackPtr2, MachinePointerInfo(), EltVT,
 683                          false, false, 0);
 684   // Load the updated vector.
 685   return DAG.getLoad(VT, dl, Ch, StackPtr,
 686                      MachinePointerInfo::getFixedStack(SPFI), false, false, 0);
 687 }
 688
 689
 690 SDValue SelectionDAGLegalize::
 691 ExpandINSERT_VECTOR_ELT(SDValue Vec, SDValue Val, SDValue Idx, DebugLoc dl) {
 692   if (ConstantSDNode *InsertPos = dyn_cast<ConstantSDNode>(Idx)) {
 693     // SCALAR_TO_VECTOR requires that the type of the value being inserted
 694     // match the element type of the vector being created, except for
 695     // integers in which case the inserted value can be over width.
 696     EVT EltVT = Vec.getValueType().getVectorElementType();
 697     if (Val.getValueType() == EltVT ||
 698         (EltVT.isInteger() && Val.getValueType().bitsGE(EltVT))) {
 699       SDValue ScVec = DAG.getNode(ISD::SCALAR_TO_VECTOR, dl,
 700                                   Vec.getValueType(), Val);
 701
 702       unsigned NumElts = Vec.getValueType().getVectorNumElements();
 703       // We generate a shuffle of InVec and ScVec, so the shuffle mask
 704       // should be 0,1,2,3,4,5... with the appropriate element replaced with
 705       // elt 0 of the RHS.
 706       SmallVector<int, 8> ShufOps;
 707       for (unsigned i = 0; i != NumElts; ++i)
 708         ShufOps.push_back(i != InsertPos->getZExtValue() ? i : NumElts);
 709
 710       return DAG.getVectorShuffle(Vec.getValueType(), dl, Vec, ScVec,
 711                                   &ShufOps[0]);
 712     }
 713   }
 714   return PerformInsertVectorEltInMemory(Vec, Val, Idx, dl);
 715 }
 716
 717 SDValue SelectionDAGLegalize::OptimizeFloatStore(StoreSDNode* ST) {
 718   // Turn 'store float 1.0, Ptr' -> 'store int 0x12345678, Ptr'
 719   // FIXME: We shouldn't do this for TargetConstantFP's.
 720   // FIXME: move this to the DAG Combiner!  Note that we can't regress due
 721   // to phase ordering between legalized code and the dag combiner.  This
 722   // probably means that we need to integrate dag combiner and legalizer
 723   // together.
 724   // We generally can't do this one for long doubles.
 725   SDValue Tmp1 = ST->getChain();
 726   SDValue Tmp2 = ST->getBasePtr();
 727   SDValue Tmp3;
 728   unsigned Alignment = ST->getAlignment();
 729   bool isVolatile = ST->isVolatile();
 730   bool isNonTemporal = ST->isNonTemporal();
 731   DebugLoc dl = ST->getDebugLoc();
 732   if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(ST->getValue())) {
 733     if (CFP->getValueType(0) == MVT::f32 &&
 734         TLI.isTypeLegal(MVT::i32)) {
 735       Tmp3 = DAG.getConstant(CFP->getValueAPF().
 736                                       bitcastToAPInt().zextOrTrunc(32),
 737                               MVT::i32);
 738       return DAG.getStore(Tmp1, dl, Tmp3, Tmp2, ST->getPointerInfo(),
 739                           isVolatile, isNonTemporal, Alignment);
 740     }
 741
 742     if (CFP->getValueType(0) == MVT::f64) {
 743       // If this target supports 64-bit registers, do a single 64-bit store.
 744       if (TLI.isTypeLegal(MVT::i64)) {
 745         Tmp3 = DAG.getConstant(CFP->getValueAPF().bitcastToAPInt().
 746                                   zextOrTrunc(64), MVT::i64);
 747         return DAG.getStore(Tmp1, dl, Tmp3, Tmp2, ST->getPointerInfo(),
 748                             isVolatile, isNonTemporal, Alignment);
 749       }
 750
 751       if (TLI.isTypeLegal(MVT::i32) && !ST->isVolatile()) {
 752         // Otherwise, if the target supports 32-bit registers, use 2 32-bit
 753         // stores.  If the target supports neither 32- nor 64-bits, this
 754         // xform is certainly not worth it.
 755         const APInt &IntVal =CFP->getValueAPF().bitcastToAPInt();
 756         SDValue Lo = DAG.getConstant(IntVal.trunc(32), MVT::i32);
 757         SDValue Hi = DAG.getConstant(IntVal.lshr(32).trunc(32), MVT::i32);
 758         if (TLI.isBigEndian()) std::swap(Lo, Hi);
 759
 760         Lo = DAG.getStore(Tmp1, dl, Lo, Tmp2, ST->getPointerInfo(), isVolatile,
 761                           isNonTemporal, Alignment);
 762         Tmp2 = DAG.getNode(ISD::ADD, dl, Tmp2.getValueType(), Tmp2,
 763                             DAG.getIntPtrConstant(4));
 764         Hi = DAG.getStore(Tmp1, dl, Hi, Tmp2,
 765                           ST->getPointerInfo().getWithOffset(4),
 766                           isVolatile, isNonTemporal, MinAlign(Alignment, 4U));
 767
 768         return DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo, Hi);
 769       }
 770     }
 771   }
 772   return SDValue(0, 0);
 773 }
 774
 775 /// LegalizeOp - Return a legal replacement for the given operation, with
 776 /// all legal operands.
 777 SDValue SelectionDAGLegalize::LegalizeOp(SDValue Op) {
 778   if (Op.getOpcode() == ISD::TargetConstant) // Allow illegal target nodes.
 779     return Op;
 780
 781   SDNode *Node = Op.getNode();
 782   DebugLoc dl = Node->getDebugLoc();
 783
 784   for (unsigned i = 0, e = Node->getNumValues(); i != e; ++i)
 785     assert(TLI.getTypeAction(*DAG.getContext(), Node->getValueType(i)) ==
 786              TargetLowering::TypeLegal &&
 787            "Unexpected illegal type!");
 788
 789   for (unsigned i = 0, e = Node->getNumOperands(); i != e; ++i)
 790     assert((TLI.getTypeAction(*DAG.getContext(),
 791                               Node->getOperand(i).getValueType()) ==
 792               TargetLowering::TypeLegal ||
 793             Node->getOperand(i).getOpcode() == ISD::TargetConstant) &&
 794            "Unexpected illegal type!");
 795
 796   // Note that LegalizeOp may be reentered even from single-use nodes, which
 797   // means that we always must cache transformed nodes.
 798   DenseMap<SDValue, SDValue>::iterator I = LegalizedNodes.find(Op);
 799   if (I != LegalizedNodes.end()) return I->second;
 800
 801   SDValue Tmp1, Tmp2, Tmp3, Tmp4;
 802   SDValue Result = Op;
 803   bool isCustom = false;
 804
 805   // Figure out the correct action; the way to query this varies by opcode
 806   TargetLowering::LegalizeAction Action = TargetLowering::Legal;
 807   bool SimpleFinishLegalizing = true;
 808   switch (Node->getOpcode()) {
 809   case ISD::INTRINSIC_W_CHAIN:
 810   case ISD::INTRINSIC_WO_CHAIN:
 811   case ISD::INTRINSIC_VOID:
 812   case ISD::VAARG:
 813   case ISD::STACKSAVE:
 814     Action = TLI.getOperationAction(Node->getOpcode(), MVT::Other);
 815     break;
 816   case ISD::SINT_TO_FP:
 817   case ISD::UINT_TO_FP:
 818   case ISD::EXTRACT_VECTOR_ELT:
 819     Action = TLI.getOperationAction(Node->getOpcode(),
 820                                     Node->getOperand(0).getValueType());
 821     break;
 822   case ISD::FP_ROUND_INREG:
 823   case ISD::SIGN_EXTEND_INREG: {
 824     EVT InnerType = cast<VTSDNode>(Node->getOperand(1))->getVT();
 825     Action = TLI.getOperationAction(Node->getOpcode(), InnerType);
 826     break;
 827   }
 828   case ISD::SELECT_CC:
 829   case ISD::SETCC:
 830   case ISD::BR_CC: {
 831     unsigned CCOperand = Node->getOpcode() == ISD::SELECT_CC ? 4 :
 832                          Node->getOpcode() == ISD::SETCC ? 2 : 1;
 833     unsigned CompareOperand = Node->getOpcode() == ISD::BR_CC ? 2 : 0;
 834     EVT OpVT = Node->getOperand(CompareOperand).getValueType();
 835     ISD::CondCode CCCode =
 836         cast<CondCodeSDNode>(Node->getOperand(CCOperand))->get();
 837     Action = TLI.getCondCodeAction(CCCode, OpVT);
 838     if (Action == TargetLowering::Legal) {
 839       if (Node->getOpcode() == ISD::SELECT_CC)
 840         Action = TLI.getOperationAction(Node->getOpcode(),
 841                                         Node->getValueType(0));
 842       else
 843         Action = TLI.getOperationAction(Node->getOpcode(), OpVT);
 844     }
 845     break;
 846   }
 847   case ISD::LOAD:
 848   case ISD::STORE:
 849     // FIXME: Model these properly.  LOAD and STORE are complicated, and
 850     // STORE expects the unlegalized operand in some cases.
 851     SimpleFinishLegalizing = false;
 852     break;
 853   case ISD::CALLSEQ_START:
 854   case ISD::CALLSEQ_END:
 855     // FIXME: This shouldn't be necessary.  These nodes have special properties
 856     // dealing with the recursive nature of legalization.  Removing this
 857     // special case should be done as part of making LegalizeDAG non-recursive.
 858     SimpleFinishLegalizing = false;
 859     break;
 860   case ISD::EXTRACT_ELEMENT:
 861   case ISD::FLT_ROUNDS_:
 862   case ISD::SADDO:
 863   case ISD::SSUBO:
 864   case ISD::UADDO:
 865   case ISD::USUBO:
 866   case ISD::SMULO:
 867   case ISD::UMULO:
 868   case ISD::FPOWI:
 869   case ISD::MERGE_VALUES:
 870   case ISD::EH_RETURN:
 871   case ISD::FRAME_TO_ARGS_OFFSET:
 872   case ISD::EH_SJLJ_SETJMP:
 873   case ISD::EH_SJLJ_LONGJMP:
 874   case ISD::EH_SJLJ_DISPATCHSETUP:
 875     // These operations lie about being legal: when they claim to be legal,
 876     // they should actually be expanded.
 877     Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
 878     if (Action == TargetLowering::Legal)
 879       Action = TargetLowering::Expand;
 880     break;
 881   case ISD::TRAMPOLINE:
 882   case ISD::FRAMEADDR:
 883   case ISD::RETURNADDR:
 884     // These operations lie about being legal: when they claim to be legal,
 885     // they should actually be custom-lowered.
 886     Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
 887     if (Action == TargetLowering::Legal)
 888       Action = TargetLowering::Custom;
 889     break;
 890   case ISD::BUILD_VECTOR:
 891     // A weird case: legalization for BUILD_VECTOR never legalizes the
 892     // operands!
 893     // FIXME: This really sucks... changing it isn't semantically incorrect,
 894     // but it massively pessimizes the code for floating-point BUILD_VECTORs
 895     // because ConstantFP operands get legalized into constant pool loads
 896     // before the BUILD_VECTOR code can see them.  It doesn't usually bite,
 897     // though, because BUILD_VECTORS usually get lowered into other nodes
 898     // which get legalized properly.
 899     SimpleFinishLegalizing = false;
 900     break;
 901   default:
 902     if (Node->getOpcode() >= ISD::BUILTIN_OP_END) {
 903       Action = TargetLowering::Legal;
 904     } else {
 905       Action = TLI.getOperationAction(Node->getOpcode(), Node->getValueType(0));
 906     }
 907     break;
 908   }
 909
 910   if (SimpleFinishLegalizing) {
 911     SmallVector<SDValue, 8> Ops, ResultVals;
 912     for (unsigned i = 0, e = Node->getNumOperands(); i != e; ++i)
 913       Ops.push_back(LegalizeOp(Node->getOperand(i)));
 914     switch (Node->getOpcode()) {
 915     default: break;
 916     case ISD::BR:
 917     case ISD::BRIND:
 918     case ISD::BR_JT:
 919     case ISD::BR_CC:
 920     case ISD::BRCOND:
 921       assert(LastCALLSEQ.size() == 1 && "branch inside CALLSEQ_BEGIN/END?");
 922       // Branches tweak the chain to include LastCALLSEQ
 923       Ops[0] = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Ops[0],
 924                            getLastCALLSEQ());
 925       Ops[0] = LegalizeOp(Ops[0]);
 926       setLastCALLSEQ(DAG.getEntryNode());
 927       break;
 928     case ISD::SHL:
 929     case ISD::SRL:
 930     case ISD::SRA:
 931     case ISD::ROTL:
 932     case ISD::ROTR:
 933       // Legalizing shifts/rotates requires adjusting the shift amount
 934       // to the appropriate width.
 935       if (!Ops[1].getValueType().isVector())
 936         Ops[1] = LegalizeOp(DAG.getShiftAmountOperand(Ops[0].getValueType(),
 937                                                       Ops[1]));
 938       break;
 939     case ISD::SRL_PARTS:
 940     case ISD::SRA_PARTS:
 941     case ISD::SHL_PARTS:
 942       // Legalizing shifts/rotates requires adjusting the shift amount
 943       // to the appropriate width.
 944       if (!Ops[2].getValueType().isVector())
 945         Ops[2] = LegalizeOp(DAG.getShiftAmountOperand(Ops[0].getValueType(),
 946                                                       Ops[2]));
 947       break;
 948     }
 949
 950     Result = SDValue(DAG.UpdateNodeOperands(Result.getNode(), Ops.data(),
 951                                             Ops.size()), 0);
 952     switch (Action) {
 953     case TargetLowering::Legal:
 954       for (unsigned i = 0, e = Node->getNumValues(); i != e; ++i)
 955         ResultVals.push_back(Result.getValue(i));
 956       break;
 957     case TargetLowering::Custom:
 958       // FIXME: The handling for custom lowering with multiple results is
 959       // a complete mess.
 960       Tmp1 = TLI.LowerOperation(Result, DAG);
 961       if (Tmp1.getNode()) {
 962         for (unsigned i = 0, e = Node->getNumValues(); i != e; ++i) {
 963           if (e == 1)
 964             ResultVals.push_back(Tmp1);
 965           else
 966             ResultVals.push_back(Tmp1.getValue(i));
 967         }
 968         break;
 969       }
 970
 971       // FALL THROUGH
 972     case TargetLowering::Expand:
 973       ExpandNode(Result.getNode(), ResultVals);
 974       break;
 975     case TargetLowering::Promote:
 976       PromoteNode(Result.getNode(), ResultVals);
 977       break;
 978     }
 979     if (!ResultVals.empty()) {
 980       for (unsigned i = 0, e = ResultVals.size(); i != e; ++i) {
 981         if (ResultVals[i] != SDValue(Node, i))
 982           ResultVals[i] = LegalizeOp(ResultVals[i]);
 983         AddLegalizedOperand(SDValue(Node, i), ResultVals[i]);
 984       }
 985       return ResultVals[Op.getResNo()];
 986     }
 987   }
 988
 989   switch (Node->getOpcode()) {
 990   default:
 991 #ifndef NDEBUG
 992     dbgs() << "NODE: ";
 993     Node->dump( &DAG);
 994     dbgs() << "\n";
 995 #endif
 996     assert(0 && "Do not know how to legalize this operator!");
 997
 998   case ISD::BUILD_VECTOR:
 999     switch (TLI.getOperationAction(ISD::BUILD_VECTOR, Node->getValueType(0))) {
1000     default: assert(0 && "This action is not supported yet!");
1001     case TargetLowering::Custom:
1002       Tmp3 = TLI.LowerOperation(Result, DAG);
1003       if (Tmp3.getNode()) {
1004         Result = Tmp3;
1005         break;
1006       }
1007       // FALLTHROUGH
1008     case TargetLowering::Expand:
1009       Result = ExpandBUILD_VECTOR(Result.getNode());
1010       break;
1011     }
1012     break;
1013   case ISD::CALLSEQ_START: {
1014     SDNode *CallEnd = FindCallEndFromCallStart(Node);
1015     assert(CallEnd && "didn't find CALLSEQ_END!");
1016
1017     // Recursively Legalize all of the inputs of the call end that do not lead
1018     // to this call start.  This ensures that any libcalls that need be inserted
1019     // are inserted *before* the CALLSEQ_START.
1020     {SmallPtrSet<SDNode*, 32> NodesLeadingTo;
1021     for (unsigned i = 0, e = CallEnd->getNumOperands(); i != e; ++i)
1022       LegalizeAllNodesNotLeadingTo(CallEnd->getOperand(i).getNode(), Node,
1023                                    NodesLeadingTo);
1024     }
1025
1026     // Now that we have legalized all of the inputs (which may have inserted
1027     // libcalls), create the new CALLSEQ_START node.
1028     Tmp1 = LegalizeOp(Node->getOperand(0));  // Legalize the chain.
1029
1030     // Merge in the last call to ensure that this call starts after the last
1031     // call ended.
1032     if (getLastCALLSEQ().getOpcode() != ISD::EntryToken) {
1033       Tmp1 = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
1034                          Tmp1, getLastCALLSEQ());
1035       Tmp1 = LegalizeOp(Tmp1);
1036     }
1037
1038     // Do not try to legalize the target-specific arguments (#1+).
1039     if (Tmp1 != Node->getOperand(0)) {
1040       SmallVector<SDValue, 8> Ops(Node->op_begin(), Node->op_end());
1041       Ops[0] = Tmp1;
1042       Result = SDValue(DAG.UpdateNodeOperands(Result.getNode(), &Ops[0],
1043                                               Ops.size()), Result.getResNo());
1044     }
1045
1046     // Remember that the CALLSEQ_START is legalized.
1047     AddLegalizedOperand(Op.getValue(0), Result);
1048     if (Node->getNumValues() == 2)    // If this has a flag result, remember it.
1049       AddLegalizedOperand(Op.getValue(1), Result.getValue(1));
1050
1051     // Now that the callseq_start and all of the non-call nodes above this call
1052     // sequence have been legalized, legalize the call itself.  During this
1053     // process, no libcalls can/will be inserted, guaranteeing that no calls
1054     // can overlap.
1055     // Note that we are selecting this call!
1056     setLastCALLSEQ(SDValue(CallEnd, 0));
1057
1058     // Legalize the call, starting from the CALLSEQ_END.
1059     LegalizeOp(getLastCALLSEQ());
1060     return Result;
1061   }
1062   case ISD::CALLSEQ_END:
1063     {
1064       SDNode *myCALLSEQ_BEGIN = FindCallStartFromCallEnd(Node);
1065
1066       // If the CALLSEQ_START node hasn't been legalized first, legalize it.
1067       // This will cause this node to be legalized as well as handling libcalls
1068       // right.
1069       if (getLastCALLSEQ().getNode() != Node) {
1070         LegalizeOp(SDValue(myCALLSEQ_BEGIN, 0));
1071         DenseMap<SDValue, SDValue>::iterator I = LegalizedNodes.find(Op);
1072         assert(I != LegalizedNodes.end() &&
1073                "Legalizing the call start should have legalized this node!");
1074         return I->second;
1075       }
1076
1077       pushLastCALLSEQ(SDValue(myCALLSEQ_BEGIN, 0));
1078     }
1079
1080     // Otherwise, the call start has been legalized and everything is going
1081     // according to plan.  Just legalize ourselves normally here.
1082     Tmp1 = LegalizeOp(Node->getOperand(0));  // Legalize the chain.
1083     // Do not try to legalize the target-specific arguments (#1+), except for
1084     // an optional flag input.
1085     if (Node->getOperand(Node->getNumOperands()-1).getValueType() != MVT::Glue){
1086       if (Tmp1 != Node->getOperand(0)) {
1087         SmallVector<SDValue, 8> Ops(Node->op_begin(), Node->op_end());
1088         Ops[0] = Tmp1;
1089         Result = SDValue(DAG.UpdateNodeOperands(Result.getNode(),
1090                                                 &Ops[0], Ops.size()),
1091                          Result.getResNo());
1092       }
1093     } else {
1094       Tmp2 = LegalizeOp(Node->getOperand(Node->getNumOperands()-1));
1095       if (Tmp1 != Node->getOperand(0) ||
1096           Tmp2 != Node->getOperand(Node->getNumOperands()-1)) {
1097         SmallVector<SDValue, 8> Ops(Node->op_begin(), Node->op_end());
1098         Ops[0] = Tmp1;
1099         Ops.back() = Tmp2;
1100         Result = SDValue(DAG.UpdateNodeOperands(Result.getNode(),
1101                                                 &Ops[0], Ops.size()),
1102                          Result.getResNo());
1103       }
1104     }
1105     // This finishes up call legalization.
1106     popLastCALLSEQ();
1107
1108     // If the CALLSEQ_END node has a flag, remember that we legalized it.
1109     AddLegalizedOperand(SDValue(Node, 0), Result.getValue(0));
1110     if (Node->getNumValues() == 2)
1111       AddLegalizedOperand(SDValue(Node, 1), Result.getValue(1));
1112     return Result.getValue(Op.getResNo());
1113   case ISD::LOAD: {
1114     LoadSDNode *LD = cast<LoadSDNode>(Node);
1115     Tmp1 = LegalizeOp(LD->getChain());   // Legalize the chain.
1116     Tmp2 = LegalizeOp(LD->getBasePtr()); // Legalize the base pointer.
1117
1118     ISD::LoadExtType ExtType = LD->getExtensionType();
1119     if (ExtType == ISD::NON_EXTLOAD) {
1120       EVT VT = Node->getValueType(0);
1121       Result = SDValue(DAG.UpdateNodeOperands(Result.getNode(),
1122                                               Tmp1, Tmp2, LD->getOffset()),
1123                        Result.getResNo());
1124       Tmp3 = Result.getValue(0);
1125       Tmp4 = Result.getValue(1);
1126
1127       switch (TLI.getOperationAction(Node->getOpcode(), VT)) {
1128       default: assert(0 && "This action is not supported yet!");
1129       case TargetLowering::Legal:
1130         // If this is an unaligned load and the target doesn't support it,
1131         // expand it.
1132         if (!TLI.allowsUnalignedMemoryAccesses(LD->getMemoryVT())) {
1133           const Type *Ty = LD->getMemoryVT().getTypeForEVT(*DAG.getContext());
1134           unsigned ABIAlignment = TLI.getTargetData()->getABITypeAlignment(Ty);
1135           if (LD->getAlignment() < ABIAlignment){
1136             Result = ExpandUnalignedLoad(cast<LoadSDNode>(Result.getNode()),
1137                                          DAG, TLI);
1138             Tmp3 = Result.getOperand(0);
1139             Tmp4 = Result.getOperand(1);
1140             Tmp3 = LegalizeOp(Tmp3);
1141             Tmp4 = LegalizeOp(Tmp4);
1142           }
1143         }
1144         break;
1145       case TargetLowering::Custom:
1146         Tmp1 = TLI.LowerOperation(Tmp3, DAG);
1147         if (Tmp1.getNode()) {
1148           Tmp3 = LegalizeOp(Tmp1);
1149           Tmp4 = LegalizeOp(Tmp1.getValue(1));
1150         }
1151         break;
1152       case TargetLowering::Promote: {
1153         // Only promote a load of vector type to another.
1154         assert(VT.isVector() && "Cannot promote this load!");
1155         // Change base type to a different vector type.
1156         EVT NVT = TLI.getTypeToPromoteTo(Node->getOpcode(), VT);
1157
1158         Tmp1 = DAG.getLoad(NVT, dl, Tmp1, Tmp2, LD->getPointerInfo(),
1159                            LD->isVolatile(), LD->isNonTemporal(),
1160                            LD->getAlignment());
1161         Tmp3 = LegalizeOp(DAG.getNode(ISD::BITCAST, dl, VT, Tmp1));
1162         Tmp4 = LegalizeOp(Tmp1.getValue(1));
1163         break;
1164       }
1165       }
1166       // Since loads produce two values, make sure to remember that we
1167       // legalized both of them.
1168       AddLegalizedOperand(SDValue(Node, 0), Tmp3);
1169       AddLegalizedOperand(SDValue(Node, 1), Tmp4);
1170       return Op.getResNo() ? Tmp4 : Tmp3;
1171     }
1172
1173     EVT SrcVT = LD->getMemoryVT();
1174     unsigned SrcWidth = SrcVT.getSizeInBits();
1175     unsigned Alignment = LD->getAlignment();
1176     bool isVolatile = LD->isVolatile();
1177     bool isNonTemporal = LD->isNonTemporal();
1178
1179     if (SrcWidth != SrcVT.getStoreSizeInBits() &&
1180         // Some targets pretend to have an i1 loading operation, and actually
1181         // load an i8.  This trick is correct for ZEXTLOAD because the top 7
1182         // bits are guaranteed to be zero; it helps the optimizers understand
1183         // that these bits are zero.  It is also useful for EXTLOAD, since it
1184         // tells the optimizers that those bits are undefined.  It would be
1185         // nice to have an effective generic way of getting these benefits...
1186         // Until such a way is found, don't insist on promoting i1 here.
1187         (SrcVT != MVT::i1 ||
1188          TLI.getLoadExtAction(ExtType, MVT::i1) == TargetLowering::Promote)) {
1189       // Promote to a byte-sized load if not loading an integral number of
1190       // bytes.  For example, promote EXTLOAD:i20 -> EXTLOAD:i24.
1191       unsigned NewWidth = SrcVT.getStoreSizeInBits();
1192       EVT NVT = EVT::getIntegerVT(*DAG.getContext(), NewWidth);
1193       SDValue Ch;
1194
1195       // The extra bits are guaranteed to be zero, since we stored them that
1196       // way.  A zext load from NVT thus automatically gives zext from SrcVT.
1197
1198       ISD::LoadExtType NewExtType =
1199         ExtType == ISD::ZEXTLOAD ? ISD::ZEXTLOAD : ISD::EXTLOAD;
1200
1201       Result = DAG.getExtLoad(NewExtType, dl, Node->getValueType(0),
1202                               Tmp1, Tmp2, LD->getPointerInfo(),
1203                               NVT, isVolatile, isNonTemporal, Alignment);
1204
1205       Ch = Result.getValue(1); // The chain.
1206
1207       if (ExtType == ISD::SEXTLOAD)
1208         // Having the top bits zero doesn't help when sign extending.
1209         Result = DAG.getNode(ISD::SIGN_EXTEND_INREG, dl,
1210                              Result.getValueType(),
1211                              Result, DAG.getValueType(SrcVT));
1212       else if (ExtType == ISD::ZEXTLOAD || NVT == Result.getValueType())
1213         // All the top bits are guaranteed to be zero - inform the optimizers.
1214         Result = DAG.getNode(ISD::AssertZext, dl,
1215                              Result.getValueType(), Result,
1216                              DAG.getValueType(SrcVT));
1217
1218       Tmp1 = LegalizeOp(Result);
1219       Tmp2 = LegalizeOp(Ch);
1220     } else if (SrcWidth & (SrcWidth - 1)) {
1221       // If not loading a power-of-2 number of bits, expand as two loads.
1222       assert(!SrcVT.isVector() && "Unsupported extload!");
1223       unsigned RoundWidth = 1 << Log2_32(SrcWidth);
1224       assert(RoundWidth < SrcWidth);
1225       unsigned ExtraWidth = SrcWidth - RoundWidth;
1226       assert(ExtraWidth < RoundWidth);
1227       assert(!(RoundWidth % 8) && !(ExtraWidth % 8) &&
1228              "Load size not an integral number of bytes!");
1229       EVT RoundVT = EVT::getIntegerVT(*DAG.getContext(), RoundWidth);
1230       EVT ExtraVT = EVT::getIntegerVT(*DAG.getContext(), ExtraWidth);
1231       SDValue Lo, Hi, Ch;
1232       unsigned IncrementSize;
1233
1234       if (TLI.isLittleEndian()) {
1235         // EXTLOAD:i24 -> ZEXTLOAD:i16 | (shl EXTLOAD@+2:i8, 16)
1236         // Load the bottom RoundWidth bits.
1237         Lo = DAG.getExtLoad(ISD::ZEXTLOAD, dl, Node->getValueType(0),
1238                             Tmp1, Tmp2,
1239                             LD->getPointerInfo(), RoundVT, isVolatile,
1240                             isNonTemporal, Alignment);
1241
1242         // Load the remaining ExtraWidth bits.
1243         IncrementSize = RoundWidth / 8;
1244         Tmp2 = DAG.getNode(ISD::ADD, dl, Tmp2.getValueType(), Tmp2,
1245                            DAG.getIntPtrConstant(IncrementSize));
1246         Hi = DAG.getExtLoad(ExtType, dl, Node->getValueType(0), Tmp1, Tmp2,
1247                             LD->getPointerInfo().getWithOffset(IncrementSize),
1248                             ExtraVT, isVolatile, isNonTemporal,
1249                             MinAlign(Alignment, IncrementSize));
1250
1251         // Build a factor node to remember that this load is independent of
1252         // the other one.
1253         Ch = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo.getValue(1),
1254                          Hi.getValue(1));
1255
1256         // Move the top bits to the right place.
1257         Hi = DAG.getNode(ISD::SHL, dl, Hi.getValueType(), Hi,
1258                          DAG.getConstant(RoundWidth,
1259                                       TLI.getShiftAmountTy(Hi.getValueType())));
1260
1261         // Join the hi and lo parts.
1262         Result = DAG.getNode(ISD::OR, dl, Node->getValueType(0), Lo, Hi);
1263       } else {
1264         // Big endian - avoid unaligned loads.
1265         // EXTLOAD:i24 -> (shl EXTLOAD:i16, 8) | ZEXTLOAD@+2:i8
1266         // Load the top RoundWidth bits.
1267         Hi = DAG.getExtLoad(ExtType, dl, Node->getValueType(0), Tmp1, Tmp2,
1268                             LD->getPointerInfo(), RoundVT, isVolatile,
1269                             isNonTemporal, Alignment);
1270
1271         // Load the remaining ExtraWidth bits.
1272         IncrementSize = RoundWidth / 8;
1273         Tmp2 = DAG.getNode(ISD::ADD, dl, Tmp2.getValueType(), Tmp2,
1274                            DAG.getIntPtrConstant(IncrementSize));
1275         Lo = DAG.getExtLoad(ISD::ZEXTLOAD,
1276                             dl, Node->getValueType(0), Tmp1, Tmp2,
1277                             LD->getPointerInfo().getWithOffset(IncrementSize),
1278                             ExtraVT, isVolatile, isNonTemporal,
1279                             MinAlign(Alignment, IncrementSize));
1280
1281         // Build a factor node to remember that this load is independent of
1282         // the other one.
1283         Ch = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo.getValue(1),
1284                          Hi.getValue(1));
1285
1286         // Move the top bits to the right place.
1287         Hi = DAG.getNode(ISD::SHL, dl, Hi.getValueType(), Hi,
1288                          DAG.getConstant(ExtraWidth,
1289                                       TLI.getShiftAmountTy(Hi.getValueType())));
1290
1291         // Join the hi and lo parts.
1292         Result = DAG.getNode(ISD::OR, dl, Node->getValueType(0), Lo, Hi);
1293       }
1294
1295       Tmp1 = LegalizeOp(Result);
1296       Tmp2 = LegalizeOp(Ch);
1297     } else {
1298       switch (TLI.getLoadExtAction(ExtType, SrcVT)) {
1299       default: assert(0 && "This action is not supported yet!");
1300       case TargetLowering::Custom:
1301         isCustom = true;
1302         // FALLTHROUGH
1303       case TargetLowering::Legal:
1304         Result = SDValue(DAG.UpdateNodeOperands(Result.getNode(),
1305                                                 Tmp1, Tmp2, LD->getOffset()),
1306                          Result.getResNo());
1307         Tmp1 = Result.getValue(0);
1308         Tmp2 = Result.getValue(1);
1309
1310         if (isCustom) {
1311           Tmp3 = TLI.LowerOperation(Result, DAG);
1312           if (Tmp3.getNode()) {
1313             Tmp1 = LegalizeOp(Tmp3);
1314             Tmp2 = LegalizeOp(Tmp3.getValue(1));
1315           }
1316         } else {
1317           // If this is an unaligned load and the target doesn't support it,
1318           // expand it.
1319           if (!TLI.allowsUnalignedMemoryAccesses(LD->getMemoryVT())) {
1320             const Type *Ty =
1321               LD->getMemoryVT().getTypeForEVT(*DAG.getContext());
1322             unsigned ABIAlignment =
1323               TLI.getTargetData()->getABITypeAlignment(Ty);
1324             if (LD->getAlignment() < ABIAlignment){
1325               Result = ExpandUnalignedLoad(cast<LoadSDNode>(Result.getNode()),
1326                                            DAG, TLI);
1327               Tmp1 = Result.getOperand(0);
1328               Tmp2 = Result.getOperand(1);
1329               Tmp1 = LegalizeOp(Tmp1);
1330               Tmp2 = LegalizeOp(Tmp2);
1331             }
1332           }
1333         }
1334         break;
1335       case TargetLowering::Expand:
1336         if (!TLI.isLoadExtLegal(ISD::EXTLOAD, SrcVT) && TLI.isTypeLegal(SrcVT)) {
1337           SDValue Load = DAG.getLoad(SrcVT, dl, Tmp1, Tmp2,
1338                                      LD->getPointerInfo(),
1339                                      LD->isVolatile(), LD->isNonTemporal(),
1340                                      LD->getAlignment());
1341           unsigned ExtendOp;
1342           switch (ExtType) {
1343           case ISD::EXTLOAD:
1344             ExtendOp = (SrcVT.isFloatingPoint() ?
1345                         ISD::FP_EXTEND : ISD::ANY_EXTEND);
1346             break;
1347           case ISD::SEXTLOAD: ExtendOp = ISD::SIGN_EXTEND; break;
1348           case ISD::ZEXTLOAD: ExtendOp = ISD::ZERO_EXTEND; break;
1349           default: llvm_unreachable("Unexpected extend load type!");
1350           }
1351           Result = DAG.getNode(ExtendOp, dl, Node->getValueType(0), Load);
1352           Tmp1 = LegalizeOp(Result);  // Relegalize new nodes.
1353           Tmp2 = LegalizeOp(Load.getValue(1));
1354           break;
1355         }
1356
1357         // If this is a promoted vector load, and the vector element types are
1358         // legal, then scalarize it.
1359         if (ExtType == ISD::EXTLOAD && SrcVT.isVector() &&
1360           TLI.isTypeLegal(Node->getValueType(0).getScalarType())) {
1361           SmallVector<SDValue, 8> LoadVals;
1362           SmallVector<SDValue, 8> LoadChains;
1363           unsigned NumElem = SrcVT.getVectorNumElements();
1364           unsigned Stride = SrcVT.getScalarType().getSizeInBits()/8;
1365
1366           for (unsigned Idx=0; Idx<NumElem; Idx++) {
1367             Tmp2 = DAG.getNode(ISD::ADD, dl, Tmp2.getValueType(), Tmp2,
1368                                 DAG.getIntPtrConstant(Stride));
1369             SDValue ScalarLoad = DAG.getExtLoad(ISD::EXTLOAD, dl,
1370                   Node->getValueType(0).getScalarType(),
1371                   Tmp1, Tmp2, LD->getPointerInfo().getWithOffset(Idx * Stride),
1372                   SrcVT.getScalarType(),
1373                   LD->isVolatile(), LD->isNonTemporal(),
1374                   LD->getAlignment());
1375
1376             LoadVals.push_back(ScalarLoad.getValue(0));
1377             LoadChains.push_back(ScalarLoad.getValue(1));
1378           }
1379           Result = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
1380             &LoadChains[0], LoadChains.size());
1381           SDValue ValRes = DAG.getNode(ISD::BUILD_VECTOR, dl,
1382             Node->getValueType(0), &LoadVals[0], LoadVals.size());
1383
1384           Tmp1 = LegalizeOp(ValRes);  // Relegalize new nodes.
1385           Tmp2 = LegalizeOp(Result.getValue(0));  // Relegalize new nodes.
1386           break;
1387         }
1388
1389         // If this is a promoted vector load, and the vector element types are
1390         // illegal, create the promoted vector from bitcasted segments.
1391         if (ExtType == ISD::EXTLOAD && SrcVT.isVector()) {
1392           EVT MemElemTy = Node->getValueType(0).getScalarType();
1393           EVT SrcSclrTy = SrcVT.getScalarType();
1394           unsigned SizeRatio =
1395             (MemElemTy.getSizeInBits() / SrcSclrTy.getSizeInBits());
1396
1397           SmallVector<SDValue, 8> LoadVals;
1398           SmallVector<SDValue, 8> LoadChains;
1399           unsigned NumElem = SrcVT.getVectorNumElements();
1400           unsigned Stride = SrcVT.getScalarType().getSizeInBits()/8;
1401
1402           for (unsigned Idx=0; Idx<NumElem; Idx++) {
1403             Tmp2 = DAG.getNode(ISD::ADD, dl, Tmp2.getValueType(), Tmp2,
1404                                 DAG.getIntPtrConstant(Stride));
1405             SDValue ScalarLoad = DAG.getExtLoad(ISD::EXTLOAD, dl,
1406                   SrcVT.getScalarType(),
1407                   Tmp1, Tmp2, LD->getPointerInfo().getWithOffset(Idx * Stride),
1408                   SrcVT.getScalarType(),
1409                   LD->isVolatile(), LD->isNonTemporal(),
1410                   LD->getAlignment());
1411             if (TLI.isBigEndian()) {
1412               // MSB (which is garbage, comes first)
1413               LoadVals.push_back(ScalarLoad.getValue(0));
1414               for (unsigned i = 0; i<SizeRatio-1; ++i)
1415                 LoadVals.push_back(DAG.getUNDEF(SrcVT.getScalarType()));
1416             } else {
1417               // LSB (which is data, comes first)
1418               for (unsigned i = 0; i<SizeRatio-1; ++i)
1419                 LoadVals.push_back(DAG.getUNDEF(SrcVT.getScalarType()));
1420               LoadVals.push_back(ScalarLoad.getValue(0));
1421             }
1422             LoadChains.push_back(ScalarLoad.getValue(1));
1423           }
1424
1425           Result = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
1426             &LoadChains[0], LoadChains.size());
1427           EVT TempWideVector = EVT::getVectorVT(*DAG.getContext(),
1428             SrcVT.getScalarType(), NumElem*SizeRatio);
1429           SDValue ValRes = DAG.getNode(ISD::BUILD_VECTOR, dl,
1430             TempWideVector, &LoadVals[0], LoadVals.size());
1431
1432           // Cast to the correct type
1433           ValRes = DAG.getNode(ISD::BITCAST, dl, Node->getValueType(0), ValRes);
1434
1435           Tmp1 = LegalizeOp(ValRes);  // Relegalize new nodes.
1436           Tmp2 = LegalizeOp(Result.getValue(0));  // Relegalize new nodes.
1437           break;
1438
1439         }
1440
1441         // FIXME: This does not work for vectors on most targets.  Sign- and
1442         // zero-extend operations are currently folded into extending loads,
1443         // whether they are legal or not, and then we end up here without any
1444         // support for legalizing them.
1445         assert(ExtType != ISD::EXTLOAD &&
1446                "EXTLOAD should always be supported!");
1447         // Turn the unsupported load into an EXTLOAD followed by an explicit
1448         // zero/sign extend inreg.
1449         Result = DAG.getExtLoad(ISD::EXTLOAD, dl, Node->getValueType(0),
1450                                 Tmp1, Tmp2, LD->getPointerInfo(), SrcVT,
1451                                 LD->isVolatile(), LD->isNonTemporal(),
1452                                 LD->getAlignment());
1453         SDValue ValRes;
1454         if (ExtType == ISD::SEXTLOAD)
1455           ValRes = DAG.getNode(ISD::SIGN_EXTEND_INREG, dl,
1456                                Result.getValueType(),
1457                                Result, DAG.getValueType(SrcVT));
1458         else
1459           ValRes = DAG.getZeroExtendInReg(Result, dl, SrcVT.getScalarType());
1460         Tmp1 = LegalizeOp(ValRes);  // Relegalize new nodes.
1461         Tmp2 = LegalizeOp(Result.getValue(1));  // Relegalize new nodes.
1462         break;
1463       }
1464     }
1465
1466     // Since loads produce two values, make sure to remember that we legalized
1467     // both of them.
1468     AddLegalizedOperand(SDValue(Node, 0), Tmp1);
1469     AddLegalizedOperand(SDValue(Node, 1), Tmp2);
1470     return Op.getResNo() ? Tmp2 : Tmp1;
1471   }
1472   case ISD::STORE: {
1473     StoreSDNode *ST = cast<StoreSDNode>(Node);
1474     Tmp1 = LegalizeOp(ST->getChain());    // Legalize the chain.
1475     Tmp2 = LegalizeOp(ST->getBasePtr());  // Legalize the pointer.
1476     unsigned Alignment = ST->getAlignment();
1477     bool isVolatile = ST->isVolatile();
1478     bool isNonTemporal = ST->isNonTemporal();
1479
1480     if (!ST->isTruncatingStore()) {
1481       if (SDNode *OptStore = OptimizeFloatStore(ST).getNode()) {
1482         Result = SDValue(OptStore, 0);
1483         break;
1484       }
1485
1486       {
1487         Tmp3 = LegalizeOp(ST->getValue());
1488         Result = SDValue(DAG.UpdateNodeOperands(Result.getNode(),
1489                                                 Tmp1, Tmp3, Tmp2,
1490                                                 ST->getOffset()),
1491                          Result.getResNo());
1492
1493         EVT VT = Tmp3.getValueType();
1494         switch (TLI.getOperationAction(ISD::STORE, VT)) {
1495         default: assert(0 && "This action is not supported yet!");
1496         case TargetLowering::Legal:
1497           // If this is an unaligned store and the target doesn't support it,
1498           // expand it.
1499           if (!TLI.allowsUnalignedMemoryAccesses(ST->getMemoryVT())) {
1500             const Type *Ty = ST->getMemoryVT().getTypeForEVT(*DAG.getContext());
1501             unsigned ABIAlignment= TLI.getTargetData()->getABITypeAlignment(Ty);
1502             if (ST->getAlignment() < ABIAlignment)
1503               Result = ExpandUnalignedStore(cast<StoreSDNode>(Result.getNode()),
1504                                             DAG, TLI);
1505           }
1506           break;
1507         case TargetLowering::Custom:
1508           Tmp1 = TLI.LowerOperation(Result, DAG);
1509           if (Tmp1.getNode()) Result = Tmp1;
1510           break;
1511         case TargetLowering::Promote:
1512           assert(VT.isVector() && "Unknown legal promote case!");
1513           Tmp3 = DAG.getNode(ISD::BITCAST, dl,
1514                              TLI.getTypeToPromoteTo(ISD::STORE, VT), Tmp3);
1515           Result = DAG.getStore(Tmp1, dl, Tmp3, Tmp2,
1516                                 ST->getPointerInfo(), isVolatile,
1517                                 isNonTemporal, Alignment);
1518           break;
1519         }
1520         break;
1521       }
1522     } else {
1523       Tmp3 = LegalizeOp(ST->getValue());
1524
1525       EVT StVT = ST->getMemoryVT();
1526       unsigned StWidth = StVT.getSizeInBits();
1527
1528       if (StWidth != StVT.getStoreSizeInBits()) {
1529         // Promote to a byte-sized store with upper bits zero if not
1530         // storing an integral number of bytes.  For example, promote
1531         // TRUNCSTORE:i1 X -> TRUNCSTORE:i8 (and X, 1)
1532         EVT NVT = EVT::getIntegerVT(*DAG.getContext(),
1533                                     StVT.getStoreSizeInBits());
1534         Tmp3 = DAG.getZeroExtendInReg(Tmp3, dl, StVT);
1535         Result = DAG.getTruncStore(Tmp1, dl, Tmp3, Tmp2, ST->getPointerInfo(),
1536                                    NVT, isVolatile, isNonTemporal, Alignment);
1537       } else if (StWidth & (StWidth - 1)) {
1538         // If not storing a power-of-2 number of bits, expand as two stores.
1539         assert(!StVT.isVector() && "Unsupported truncstore!");
1540         unsigned RoundWidth = 1 << Log2_32(StWidth);
1541         assert(RoundWidth < StWidth);
1542         unsigned ExtraWidth = StWidth - RoundWidth;
1543         assert(ExtraWidth < RoundWidth);
1544         assert(!(RoundWidth % 8) && !(ExtraWidth % 8) &&
1545                "Store size not an integral number of bytes!");
1546         EVT RoundVT = EVT::getIntegerVT(*DAG.getContext(), RoundWidth);
1547         EVT ExtraVT = EVT::getIntegerVT(*DAG.getContext(), ExtraWidth);
1548         SDValue Lo, Hi;
1549         unsigned IncrementSize;
1550
1551         if (TLI.isLittleEndian()) {
1552           // TRUNCSTORE:i24 X -> TRUNCSTORE:i16 X, TRUNCSTORE@+2:i8 (srl X, 16)
1553           // Store the bottom RoundWidth bits.
1554           Lo = DAG.getTruncStore(Tmp1, dl, Tmp3, Tmp2, ST->getPointerInfo(),
1555                                  RoundVT,
1556                                  isVolatile, isNonTemporal, Alignment);
1557
1558           // Store the remaining ExtraWidth bits.
1559           IncrementSize = RoundWidth / 8;
1560           Tmp2 = DAG.getNode(ISD::ADD, dl, Tmp2.getValueType(), Tmp2,
1561                              DAG.getIntPtrConstant(IncrementSize));
1562           Hi = DAG.getNode(ISD::SRL, dl, Tmp3.getValueType(), Tmp3,
1563                            DAG.getConstant(RoundWidth,
1564                                     TLI.getShiftAmountTy(Tmp3.getValueType())));
1565           Hi = DAG.getTruncStore(Tmp1, dl, Hi, Tmp2,
1566                              ST->getPointerInfo().getWithOffset(IncrementSize),
1567                                  ExtraVT, isVolatile, isNonTemporal,
1568                                  MinAlign(Alignment, IncrementSize));
1569         } else {
1570           // Big endian - avoid unaligned stores.
1571           // TRUNCSTORE:i24 X -> TRUNCSTORE:i16 (srl X, 8), TRUNCSTORE@+2:i8 X
1572           // Store the top RoundWidth bits.
1573           Hi = DAG.getNode(ISD::SRL, dl, Tmp3.getValueType(), Tmp3,
1574                            DAG.getConstant(ExtraWidth,
1575                                     TLI.getShiftAmountTy(Tmp3.getValueType())));
1576           Hi = DAG.getTruncStore(Tmp1, dl, Hi, Tmp2, ST->getPointerInfo(),
1577                                  RoundVT, isVolatile, isNonTemporal, Alignment);
1578
1579           // Store the remaining ExtraWidth bits.
1580           IncrementSize = RoundWidth / 8;
1581           Tmp2 = DAG.getNode(ISD::ADD, dl, Tmp2.getValueType(), Tmp2,
1582                              DAG.getIntPtrConstant(IncrementSize));
1583           Lo = DAG.getTruncStore(Tmp1, dl, Tmp3, Tmp2,
1584                               ST->getPointerInfo().getWithOffset(IncrementSize),
1585                                  ExtraVT, isVolatile, isNonTemporal,
1586                                  MinAlign(Alignment, IncrementSize));
1587         }
1588
1589         // The order of the stores doesn't matter.
1590         Result = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, Lo, Hi);
1591       } else {
1592         if (Tmp1 != ST->getChain() || Tmp3 != ST->getValue() ||
1593             Tmp2 != ST->getBasePtr())
1594           Result = SDValue(DAG.UpdateNodeOperands(Result.getNode(),
1595                                                   Tmp1, Tmp3, Tmp2,
1596                                                   ST->getOffset()),
1597                            Result.getResNo());
1598
1599         switch (TLI.getTruncStoreAction(ST->getValue().getValueType(), StVT)) {
1600         default: assert(0 && "This action is not supported yet!");
1601         case TargetLowering::Legal:
1602           // If this is an unaligned store and the target doesn't support it,
1603           // expand it.
1604           if (!TLI.allowsUnalignedMemoryAccesses(ST->getMemoryVT())) {
1605             const Type *Ty = ST->getMemoryVT().getTypeForEVT(*DAG.getContext());
1606             unsigned ABIAlignment= TLI.getTargetData()->getABITypeAlignment(Ty);
1607             if (ST->getAlignment() < ABIAlignment)
1608               Result = ExpandUnalignedStore(cast<StoreSDNode>(Result.getNode()),
1609                                             DAG, TLI);
1610           }
1611           break;
1612         case TargetLowering::Custom:
1613           Result = TLI.LowerOperation(Result, DAG);
1614           break;
1615         case Expand:
1616
1617           EVT WideScalarVT = Tmp3.getValueType().getScalarType();
1618           EVT NarrowScalarVT = StVT.getScalarType();
1619
1620           // The Store type is illegal, must scalarize the vector store.
1621           SmallVector<SDValue, 8> Stores;
1622           bool ScalarLegal = TLI.isTypeLegal(WideScalarVT);
1623           if (!TLI.isTypeLegal(StVT) && StVT.isVector() && ScalarLegal) {
1624             unsigned NumElem = StVT.getVectorNumElements();
1625
1626             unsigned ScalarSize = StVT.getScalarType().getSizeInBits();
1627             // Round odd types to the next pow of two.
1628             if (!isPowerOf2_32(ScalarSize))
1629               ScalarSize = NextPowerOf2(ScalarSize);
1630             // Types smaller than 8 bits are promoted to 8 bits.
1631             ScalarSize = std::max<unsigned>(ScalarSize, 8);
1632             // Store stride
1633             unsigned Stride = ScalarSize/8;
1634             assert(isPowerOf2_32(Stride) && "Stride must be a power of two");
1635
1636             for (unsigned Idx=0; Idx<NumElem; Idx++) {
1637               SDValue Ex = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl,
1638                                        WideScalarVT, Tmp3, DAG.getIntPtrConstant(Idx));
1639
1640
1641               EVT NVT = EVT::getIntegerVT(*DAG.getContext(), ScalarSize);
1642
1643               Ex = DAG.getNode(ISD::TRUNCATE, dl, NVT, Ex);
1644               Tmp2 = DAG.getNode(ISD::ADD, dl, Tmp2.getValueType(), Tmp2,
1645                                  DAG.getIntPtrConstant(Stride));
1646               SDValue Store = DAG.getStore(Tmp1, dl, Ex, Tmp2,
1647                                            ST->getPointerInfo().getWithOffset(Idx*Stride),
1648                                            isVolatile, isNonTemporal, Alignment);
1649               Stores.push_back(Store);
1650             }
1651             Result = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
1652                                  &Stores[0], Stores.size());
1653             break;
1654           }
1655
1656           // The Store type is illegal, must scalarize the vector store.
1657           // However, the scalar type is illegal. Must bitcast the result
1658           // and store it in smaller parts.
1659           if (!TLI.isTypeLegal(StVT) && StVT.isVector()) {
1660             unsigned WideNumElem = StVT.getVectorNumElements();
1661             unsigned Stride = NarrowScalarVT.getSizeInBits()/8;
1662
1663             unsigned SizeRatio =
1664               (WideScalarVT.getSizeInBits() / NarrowScalarVT.getSizeInBits());
1665
1666             EVT CastValueVT = EVT::getVectorVT(*DAG.getContext(), NarrowScalarVT,
1667                                                SizeRatio*WideNumElem);
1668
1669             // Cast the wide elem vector to wider vec with smaller elem type.
1670             // Example <2 x i64> -> <4 x i32>
1671             Tmp3 = DAG.getNode(ISD::BITCAST, dl, CastValueVT, Tmp3);
1672
1673             for (unsigned Idx=0; Idx<WideNumElem*SizeRatio; Idx++) {
1674               // Extract elment i
1675               SDValue Ex = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl,
1676                                        NarrowScalarVT, Tmp3, DAG.getIntPtrConstant(Idx));
1677               // bump pointer.
1678               Tmp2 = DAG.getNode(ISD::ADD, dl, Tmp2.getValueType(), Tmp2,
1679                                  DAG.getIntPtrConstant(Stride));
1680
1681               // Store if, this element is:
1682               //  - First element on big endian, or
1683               //  - Last element on little endian
1684               if (( TLI.isBigEndian() && (Idx%SizeRatio == 0)) ||
1685                   ((!TLI.isBigEndian() && (Idx%SizeRatio == SizeRatio-1)))) {
1686                 SDValue Store = DAG.getStore(Tmp1, dl, Ex, Tmp2,
1687                                              ST->getPointerInfo().getWithOffset(Idx*Stride),
1688                                              isVolatile, isNonTemporal, Alignment);
1689                 Stores.push_back(Store);
1690               }
1691             }
1692             Result = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
1693                                  &Stores[0], Stores.size());
1694             break;
1695           }
1696
1697
1698           // TRUNCSTORE:i16 i32 -> STORE i16
1699           assert(TLI.isTypeLegal(StVT) && "Do not know how to expand this store!");
1700           Tmp3 = DAG.getNode(ISD::TRUNCATE, dl, StVT, Tmp3);
1701           Result = DAG.getStore(Tmp1, dl, Tmp3, Tmp2, ST->getPointerInfo(),
1702                                 isVolatile, isNonTemporal, Alignment);
1703           break;
1704         }
1705       }
1706     }
1707     break;
1708   }
1709   }
1710   assert(Result.getValueType() == Op.getValueType() &&
1711          "Bad legalization!");
1712
1713   // Make sure that the generated code is itself legal.
1714   if (Result != Op)
1715     Result = LegalizeOp(Result);
1716
1717   // Note that LegalizeOp may be reentered even from single-use nodes, which
1718   // means that we always must cache transformed nodes.
1719   AddLegalizedOperand(Op, Result);
1720   return Result;
1721 }
1722
1723 SDValue SelectionDAGLegalize::ExpandExtractFromVectorThroughStack(SDValue Op) {
1724   SDValue Vec = Op.getOperand(0);
1725   SDValue Idx = Op.getOperand(1);
1726   DebugLoc dl = Op.getDebugLoc();
1727   // Store the value to a temporary stack slot, then LOAD the returned part.
1728   SDValue StackPtr = DAG.CreateStackTemporary(Vec.getValueType());
1729   SDValue Ch = DAG.getStore(DAG.getEntryNode(), dl, Vec, StackPtr,
1730                             MachinePointerInfo(), false, false, 0);
1731
1732   // Add the offset to the index.
1733   unsigned EltSize =
1734       Vec.getValueType().getVectorElementType().getSizeInBits()/8;
1735   Idx = DAG.getNode(ISD::MUL, dl, Idx.getValueType(), Idx,
1736                     DAG.getConstant(EltSize, Idx.getValueType()));
1737
1738   if (Idx.getValueType().bitsGT(TLI.getPointerTy()))
1739     Idx = DAG.getNode(ISD::TRUNCATE, dl, TLI.getPointerTy(), Idx);
1740   else
1741     Idx = DAG.getNode(ISD::ZERO_EXTEND, dl, TLI.getPointerTy(), Idx);
1742
1743   StackPtr = DAG.getNode(ISD::ADD, dl, Idx.getValueType(), Idx, StackPtr);
1744
1745   if (Op.getValueType().isVector())
1746     return DAG.getLoad(Op.getValueType(), dl, Ch, StackPtr,MachinePointerInfo(),
1747                        false, false, 0);
1748   return DAG.getExtLoad(ISD::EXTLOAD, dl, Op.getValueType(), Ch, StackPtr,
1749                         MachinePointerInfo(),
1750                         Vec.getValueType().getVectorElementType(),
1751                         false, false, 0);
1752 }
1753
1754 SDValue SelectionDAGLegalize::ExpandInsertToVectorThroughStack(SDValue Op) {
1755   assert(Op.getValueType().isVector() && "Non-vector insert subvector!");
1756
1757   SDValue Vec  = Op.getOperand(0);
1758   SDValue Part = Op.getOperand(1);
1759   SDValue Idx  = Op.getOperand(2);
1760   DebugLoc dl  = Op.getDebugLoc();
1761
1762   // Store the value to a temporary stack slot, then LOAD the returned part.
1763
1764   SDValue StackPtr = DAG.CreateStackTemporary(Vec.getValueType());
1765   int FI = cast<FrameIndexSDNode>(StackPtr.getNode())->getIndex();
1766   MachinePointerInfo PtrInfo = MachinePointerInfo::getFixedStack(FI);
1767
1768   // First store the whole vector.
1769   SDValue Ch = DAG.getStore(DAG.getEntryNode(), dl, Vec, StackPtr, PtrInfo,
1770                             false, false, 0);
1771
1772   // Then store the inserted part.
1773
1774   // Add the offset to the index.
1775   unsigned EltSize =
1776       Vec.getValueType().getVectorElementType().getSizeInBits()/8;
1777
1778   Idx = DAG.getNode(ISD::MUL, dl, Idx.getValueType(), Idx,
1779                     DAG.getConstant(EltSize, Idx.getValueType()));
1780
1781   if (Idx.getValueType().bitsGT(TLI.getPointerTy()))
1782     Idx = DAG.getNode(ISD::TRUNCATE, dl, TLI.getPointerTy(), Idx);
1783   else
1784     Idx = DAG.getNode(ISD::ZERO_EXTEND, dl, TLI.getPointerTy(), Idx);
1785
1786   SDValue SubStackPtr = DAG.getNode(ISD::ADD, dl, Idx.getValueType(), Idx,
1787                                     StackPtr);
1788
1789   // Store the subvector.
1790   Ch = DAG.getStore(DAG.getEntryNode(), dl, Part, SubStackPtr,
1791                     MachinePointerInfo(), false, false, 0);
1792
1793   // Finally, load the updated vector.
1794   return DAG.getLoad(Op.getValueType(), dl, Ch, StackPtr, PtrInfo,
1795                      false, false, 0);
1796 }
1797
1798 SDValue SelectionDAGLegalize::ExpandVectorBuildThroughStack(SDNode* Node) {
1799   // We can't handle this case efficiently.  Allocate a sufficiently
1800   // aligned object on the stack, store each element into it, then load
1801   // the result as a vector.
1802   // Create the stack frame object.
1803   EVT VT = Node->getValueType(0);
1804   EVT EltVT = VT.getVectorElementType();
1805   DebugLoc dl = Node->getDebugLoc();
1806   SDValue FIPtr = DAG.CreateStackTemporary(VT);
1807   int FI = cast<FrameIndexSDNode>(FIPtr.getNode())->getIndex();
1808   MachinePointerInfo PtrInfo = MachinePointerInfo::getFixedStack(FI);
1809
1810   // Emit a store of each element to the stack slot.
1811   SmallVector<SDValue, 8> Stores;
1812   unsigned TypeByteSize = EltVT.getSizeInBits() / 8;
1813   // Store (in the right endianness) the elements to memory.
1814   for (unsigned i = 0, e = Node->getNumOperands(); i != e; ++i) {
1815     // Ignore undef elements.
1816     if (Node->getOperand(i).getOpcode() == ISD::UNDEF) continue;
1817
1818     unsigned Offset = TypeByteSize*i;
1819
1820     SDValue Idx = DAG.getConstant(Offset, FIPtr.getValueType());
1821     Idx = DAG.getNode(ISD::ADD, dl, FIPtr.getValueType(), FIPtr, Idx);
1822
1823     // If the destination vector element type is narrower than the source
1824     // element type, only store the bits necessary.
1825     if (EltVT.bitsLT(Node->getOperand(i).getValueType().getScalarType())) {
1826       Stores.push_back(DAG.getTruncStore(DAG.getEntryNode(), dl,
1827                                          Node->getOperand(i), Idx,
1828                                          PtrInfo.getWithOffset(Offset),
1829                                          EltVT, false, false, 0));
1830     } else
1831       Stores.push_back(DAG.getStore(DAG.getEntryNode(), dl,
1832                                     Node->getOperand(i), Idx,
1833                                     PtrInfo.getWithOffset(Offset),
1834                                     false, false, 0));
1835   }
1836
1837   SDValue StoreChain;
1838   if (!Stores.empty())    // Not all undef elements?
1839     StoreChain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
1840                              &Stores[0], Stores.size());
1841   else
1842     StoreChain = DAG.getEntryNode();
1843
1844   // Result is a load from the stack slot.
1845   return DAG.getLoad(VT, dl, StoreChain, FIPtr, PtrInfo, false, false, 0);
1846 }
1847
1848 SDValue SelectionDAGLegalize::ExpandFCOPYSIGN(SDNode* Node) {
1849   DebugLoc dl = Node->getDebugLoc();
1850   SDValue Tmp1 = Node->getOperand(0);
1851   SDValue Tmp2 = Node->getOperand(1);
1852
1853   // Get the sign bit of the RHS.  First obtain a value that has the same
1854   // sign as the sign bit, i.e. negative if and only if the sign bit is 1.
1855   SDValue SignBit;
1856   EVT FloatVT = Tmp2.getValueType();
1857   EVT IVT = EVT::getIntegerVT(*DAG.getContext(), FloatVT.getSizeInBits());
1858   if (TLI.isTypeLegal(IVT)) {
1859     // Convert to an integer with the same sign bit.
1860     SignBit = DAG.getNode(ISD::BITCAST, dl, IVT, Tmp2);
1861   } else {
1862     // Store the float to memory, then load the sign part out as an integer.
1863     MVT LoadTy = TLI.getPointerTy();
1864     // First create a temporary that is aligned for both the load and store.
1865     SDValue StackPtr = DAG.CreateStackTemporary(FloatVT, LoadTy);
1866     // Then store the float to it.
1867     SDValue Ch =
1868       DAG.getStore(DAG.getEntryNode(), dl, Tmp2, StackPtr, MachinePointerInfo(),
1869                    false, false, 0);
1870     if (TLI.isBigEndian()) {
1871       assert(FloatVT.isByteSized() && "Unsupported floating point type!");
1872       // Load out a legal integer with the same sign bit as the float.
1873       SignBit = DAG.getLoad(LoadTy, dl, Ch, StackPtr, MachinePointerInfo(),
1874                             false, false, 0);
1875     } else { // Little endian
1876       SDValue LoadPtr = StackPtr;
1877       // The float may be wider than the integer we are going to load.  Advance
1878       // the pointer so that the loaded integer will contain the sign bit.
1879       unsigned Strides = (FloatVT.getSizeInBits()-1)/LoadTy.getSizeInBits();
1880       unsigned ByteOffset = (Strides * LoadTy.getSizeInBits()) / 8;
1881       LoadPtr = DAG.getNode(ISD::ADD, dl, LoadPtr.getValueType(),
1882                             LoadPtr, DAG.getIntPtrConstant(ByteOffset));
1883       // Load a legal integer containing the sign bit.
1884       SignBit = DAG.getLoad(LoadTy, dl, Ch, LoadPtr, MachinePointerInfo(),
1885                             false, false, 0);
1886       // Move the sign bit to the top bit of the loaded integer.
1887       unsigned BitShift = LoadTy.getSizeInBits() -
1888         (FloatVT.getSizeInBits() - 8 * ByteOffset);
1889       assert(BitShift < LoadTy.getSizeInBits() && "Pointer advanced wrong?");
1890       if (BitShift)
1891         SignBit = DAG.getNode(ISD::SHL, dl, LoadTy, SignBit,
1892                               DAG.getConstant(BitShift,
1893                                  TLI.getShiftAmountTy(SignBit.getValueType())));
1894     }
1895   }
1896   // Now get the sign bit proper, by seeing whether the value is negative.
1897   SignBit = DAG.getSetCC(dl, TLI.getSetCCResultType(SignBit.getValueType()),
1898                          SignBit, DAG.getConstant(0, SignBit.getValueType()),
1899                          ISD::SETLT);
1900   // Get the absolute value of the result.
1901   SDValue AbsVal = DAG.getNode(ISD::FABS, dl, Tmp1.getValueType(), Tmp1);
1902   // Select between the nabs and abs value based on the sign bit of
1903   // the input.
1904   return DAG.getNode(ISD::SELECT, dl, AbsVal.getValueType(), SignBit,
1905                      DAG.getNode(ISD::FNEG, dl, AbsVal.getValueType(), AbsVal),
1906                      AbsVal);
1907 }
1908
1909 void SelectionDAGLegalize::ExpandDYNAMIC_STACKALLOC(SDNode* Node,
1910                                            SmallVectorImpl<SDValue> &Results) {
1911   unsigned SPReg = TLI.getStackPointerRegisterToSaveRestore();
1912   assert(SPReg && "Target cannot require DYNAMIC_STACKALLOC expansion and"
1913           " not tell us which reg is the stack pointer!");
1914   DebugLoc dl = Node->getDebugLoc();
1915   EVT VT = Node->getValueType(0);
1916   SDValue Tmp1 = SDValue(Node, 0);
1917   SDValue Tmp2 = SDValue(Node, 1);
1918   SDValue Tmp3 = Node->getOperand(2);
1919   SDValue Chain = Tmp1.getOperand(0);
1920
1921   // Chain the dynamic stack allocation so that it doesn't modify the stack
1922   // pointer when other instructions are using the stack.
1923   Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(0, true));
1924
1925   SDValue Size  = Tmp2.getOperand(1);
1926   SDValue SP = DAG.getCopyFromReg(Chain, dl, SPReg, VT);
1927   Chain = SP.getValue(1);
1928   unsigned Align = cast<ConstantSDNode>(Tmp3)->getZExtValue();
1929   unsigned StackAlign = TM.getFrameLowering()->getStackAlignment();
1930   if (Align > StackAlign)
1931     SP = DAG.getNode(ISD::AND, dl, VT, SP,
1932                       DAG.getConstant(-(uint64_t)Align, VT));
1933   Tmp1 = DAG.getNode(ISD::SUB, dl, VT, SP, Size);       // Value
1934   Chain = DAG.getCopyToReg(Chain, dl, SPReg, Tmp1);     // Output chain
1935
1936   Tmp2 = DAG.getCALLSEQ_END(Chain,  DAG.getIntPtrConstant(0, true),
1937                             DAG.getIntPtrConstant(0, true), SDValue());
1938
1939   Results.push_back(Tmp1);
1940   Results.push_back(Tmp2);
1941 }
1942
1943 /// LegalizeSetCCCondCode - Legalize a SETCC with given LHS and RHS and
1944 /// condition code CC on the current target. This routine expands SETCC with
1945 /// illegal condition code into AND / OR of multiple SETCC values.
1946 void SelectionDAGLegalize::LegalizeSetCCCondCode(EVT VT,
1947                                                  SDValue &LHS, SDValue &RHS,
1948                                                  SDValue &CC,
1949                                                  DebugLoc dl) {
1950   EVT OpVT = LHS.getValueType();
1951   ISD::CondCode CCCode = cast<CondCodeSDNode>(CC)->get();
1952   switch (TLI.getCondCodeAction(CCCode, OpVT)) {
1953   default: assert(0 && "Unknown condition code action!");
1954   case TargetLowering::Legal:
1955     // Nothing to do.
1956     break;
1957   case TargetLowering::Expand: {
1958     ISD::CondCode CC1 = ISD::SETCC_INVALID, CC2 = ISD::SETCC_INVALID;
1959     unsigned Opc = 0;
1960     switch (CCCode) {
1961     default: assert(0 && "Don't know how to expand this condition!");
1962     case ISD::SETOEQ: CC1 = ISD::SETEQ; CC2 = ISD::SETO;  Opc = ISD::AND; break;
1963     case ISD::SETOGT: CC1 = ISD::SETGT; CC2 = ISD::SETO;  Opc = ISD::AND; break;
1964     case ISD::SETOGE: CC1 = ISD::SETGE; CC2 = ISD::SETO;  Opc = ISD::AND; break;
1965     case ISD::SETOLT: CC1 = ISD::SETLT; CC2 = ISD::SETO;  Opc = ISD::AND; break;
1966     case ISD::SETOLE: CC1 = ISD::SETLE; CC2 = ISD::SETO;  Opc = ISD::AND; break;
1967     case ISD::SETONE: CC1 = ISD::SETNE; CC2 = ISD::SETO;  Opc = ISD::AND; break;
1968     case ISD::SETUEQ: CC1 = ISD::SETEQ; CC2 = ISD::SETUO; Opc = ISD::OR;  break;
1969     case ISD::SETUGT: CC1 = ISD::SETGT; CC2 = ISD::SETUO; Opc = ISD::OR;  break;
1970     case ISD::SETUGE: CC1 = ISD::SETGE; CC2 = ISD::SETUO; Opc = ISD::OR;  break;
1971     case ISD::SETULT: CC1 = ISD::SETLT; CC2 = ISD::SETUO; Opc = ISD::OR;  break;
1972     case ISD::SETULE: CC1 = ISD::SETLE; CC2 = ISD::SETUO; Opc = ISD::OR;  break;
1973     case ISD::SETUNE: CC1 = ISD::SETNE; CC2 = ISD::SETUO; Opc = ISD::OR;  break;
1974     // FIXME: Implement more expansions.
1975     }
1976
1977     SDValue SetCC1 = DAG.getSetCC(dl, VT, LHS, RHS, CC1);
1978     SDValue SetCC2 = DAG.getSetCC(dl, VT, LHS, RHS, CC2);
1979     LHS = DAG.getNode(Opc, dl, VT, SetCC1, SetCC2);
1980     RHS = SDValue();
1981     CC  = SDValue();
1982     break;
1983   }
1984   }
1985 }
1986
1987 /// EmitStackConvert - Emit a store/load combination to the stack.  This stores
1988 /// SrcOp to a stack slot of type SlotVT, truncating it if needed.  It then does
1989 /// a load from the stack slot to DestVT, extending it if needed.
1990 /// The resultant code need not be legal.
1991 SDValue SelectionDAGLegalize::EmitStackConvert(SDValue SrcOp,
1992                                                EVT SlotVT,
1993                                                EVT DestVT,
1994                                                DebugLoc dl) {
1995   // Create the stack frame object.
1996   unsigned SrcAlign =
1997     TLI.getTargetData()->getPrefTypeAlignment(SrcOp.getValueType().
1998                                               getTypeForEVT(*DAG.getContext()));
1999   SDValue FIPtr = DAG.CreateStackTemporary(SlotVT, SrcAlign);
2000
2001   FrameIndexSDNode *StackPtrFI = cast<FrameIndexSDNode>(FIPtr);
2002   int SPFI = StackPtrFI->getIndex();
2003   MachinePointerInfo PtrInfo = MachinePointerInfo::getFixedStack(SPFI);
2004
2005   unsigned SrcSize = SrcOp.getValueType().getSizeInBits();
2006   unsigned SlotSize = SlotVT.getSizeInBits();
2007   unsigned DestSize = DestVT.getSizeInBits();
2008   const Type *DestType = DestVT.getTypeForEVT(*DAG.getContext());
2009   unsigned DestAlign = TLI.getTargetData()->getPrefTypeAlignment(DestType);
2010
2011   // Emit a store to the stack slot.  Use a truncstore if the input value is
2012   // later than DestVT.
2013   SDValue Store;
2014
2015   if (SrcSize > SlotSize)
2016     Store = DAG.getTruncStore(DAG.getEntryNode(), dl, SrcOp, FIPtr,
2017                               PtrInfo, SlotVT, false, false, SrcAlign);
2018   else {
2019     assert(SrcSize == SlotSize && "Invalid store");
2020     Store = DAG.getStore(DAG.getEntryNode(), dl, SrcOp, FIPtr,
2021                          PtrInfo, false, false, SrcAlign);
2022   }
2023
2024   // Result is a load from the stack slot.
2025   if (SlotSize == DestSize)
2026     return DAG.getLoad(DestVT, dl, Store, FIPtr, PtrInfo,
2027                        false, false, DestAlign);
2028
2029   assert(SlotSize < DestSize && "Unknown extension!");
2030   return DAG.getExtLoad(ISD::EXTLOAD, dl, DestVT, Store, FIPtr,
2031                         PtrInfo, SlotVT, false, false, DestAlign);
2032 }
2033
2034 SDValue SelectionDAGLegalize::ExpandSCALAR_TO_VECTOR(SDNode *Node) {
2035   DebugLoc dl = Node->getDebugLoc();
2036   // Create a vector sized/aligned stack slot, store the value to element #0,
2037   // then load the whole vector back out.
2038   SDValue StackPtr = DAG.CreateStackTemporary(Node->getValueType(0));
2039
2040   FrameIndexSDNode *StackPtrFI = cast<FrameIndexSDNode>(StackPtr);
2041   int SPFI = StackPtrFI->getIndex();
2042
2043   SDValue Ch = DAG.getTruncStore(DAG.getEntryNode(), dl, Node->getOperand(0),
2044                                  StackPtr,
2045                                  MachinePointerInfo::getFixedStack(SPFI),
2046                                  Node->getValueType(0).getVectorElementType(),
2047                                  false, false, 0);
2048   return DAG.getLoad(Node->getValueType(0), dl, Ch, StackPtr,
2049                      MachinePointerInfo::getFixedStack(SPFI),
2050                      false, false, 0);
2051 }
2052
2053
2054 /// ExpandBUILD_VECTOR - Expand a BUILD_VECTOR node on targets that don't
2055 /// support the operation, but do support the resultant vector type.
2056 SDValue SelectionDAGLegalize::ExpandBUILD_VECTOR(SDNode *Node) {
2057   unsigned NumElems = Node->getNumOperands();
2058   SDValue Value1, Value2;
2059   DebugLoc dl = Node->getDebugLoc();
2060   EVT VT = Node->getValueType(0);
2061   EVT OpVT = Node->getOperand(0).getValueType();
2062   EVT EltVT = VT.getVectorElementType();
2063
2064   // If the only non-undef value is the low element, turn this into a
2065   // SCALAR_TO_VECTOR node.  If this is { X, X, X, X }, determine X.
2066   bool isOnlyLowElement = true;
2067   bool MoreThanTwoValues = false;
2068   bool isConstant = true;
2069   for (unsigned i = 0; i < NumElems; ++i) {
2070     SDValue V = Node->getOperand(i);
2071     if (V.getOpcode() == ISD::UNDEF)
2072       continue;
2073     if (i > 0)
2074       isOnlyLowElement = false;
2075     if (!isa<ConstantFPSDNode>(V) && !isa<ConstantSDNode>(V))
2076       isConstant = false;
2077
2078     if (!Value1.getNode()) {
2079       Value1 = V;
2080     } else if (!Value2.getNode()) {
2081       if (V != Value1)
2082         Value2 = V;
2083     } else if (V != Value1 && V != Value2) {
2084       MoreThanTwoValues = true;
2085     }
2086   }
2087
2088   if (!Value1.getNode())
2089     return DAG.getUNDEF(VT);
2090
2091   if (isOnlyLowElement)
2092     return DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, VT, Node->getOperand(0));
2093
2094   // If all elements are constants, create a load from the constant pool.
2095   if (isConstant) {
2096     std::vector<Constant*> CV;
2097     for (unsigned i = 0, e = NumElems; i != e; ++i) {
2098       if (ConstantFPSDNode *V =
2099           dyn_cast<ConstantFPSDNode>(Node->getOperand(i))) {
2100         CV.push_back(const_cast<ConstantFP *>(V->getConstantFPValue()));
2101       } else if (ConstantSDNode *V =
2102                  dyn_cast<ConstantSDNode>(Node->getOperand(i))) {
2103         if (OpVT==EltVT)
2104           CV.push_back(const_cast<ConstantInt *>(V->getConstantIntValue()));
2105         else {
2106           // If OpVT and EltVT don't match, EltVT is not legal and the
2107           // element values have been promoted/truncated earlier.  Undo this;
2108           // we don't want a v16i8 to become a v16i32 for example.
2109           const ConstantInt *CI = V->getConstantIntValue();
2110           CV.push_back(ConstantInt::get(EltVT.getTypeForEVT(*DAG.getContext()),
2111                                         CI->getZExtValue()));
2112         }
2113       } else {
2114         assert(Node->getOperand(i).getOpcode() == ISD::UNDEF);
2115         const Type *OpNTy = EltVT.getTypeForEVT(*DAG.getContext());
2116         CV.push_back(UndefValue::get(OpNTy));
2117       }
2118     }
2119     Constant *CP = ConstantVector::get(CV);
2120     SDValue CPIdx = DAG.getConstantPool(CP, TLI.getPointerTy());
2121     unsigned Alignment = cast<ConstantPoolSDNode>(CPIdx)->getAlignment();
2122     return DAG.getLoad(VT, dl, DAG.getEntryNode(), CPIdx,
2123                        MachinePointerInfo::getConstantPool(),
2124                        false, false, Alignment);
2125   }
2126
2127   if (!MoreThanTwoValues) {
2128     SmallVector<int, 8> ShuffleVec(NumElems, -1);
2129     for (unsigned i = 0; i < NumElems; ++i) {
2130       SDValue V = Node->getOperand(i);
2131       if (V.getOpcode() == ISD::UNDEF)
2132         continue;
2133       ShuffleVec[i] = V == Value1 ? 0 : NumElems;
2134     }
2135     if (TLI.isShuffleMaskLegal(ShuffleVec, Node->getValueType(0))) {
2136       // Get the splatted value into the low element of a vector register.
2137       SDValue Vec1 = DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, VT, Value1);
2138       SDValue Vec2;
2139       if (Value2.getNode())
2140         Vec2 = DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, VT, Value2);
2141       else
2142         Vec2 = DAG.getUNDEF(VT);
2143
2144       // Return shuffle(LowValVec, undef, <0,0,0,0>)
2145       return DAG.getVectorShuffle(VT, dl, Vec1, Vec2, ShuffleVec.data());
2146     }
2147   }
2148
2149   // Otherwise, we can't handle this case efficiently.
2150   return ExpandVectorBuildThroughStack(Node);
2151 }
2152
2153 // ExpandLibCall - Expand a node into a call to a libcall.  If the result value
2154 // does not fit into a register, return the lo part and set the hi part to the
2155 // by-reg argument.  If it does fit into a single register, return the result
2156 // and leave the Hi part unset.
2157 SDValue SelectionDAGLegalize::ExpandLibCall(RTLIB::Libcall LC, SDNode *Node,
2158                                             bool isSigned) {
2159   // The input chain to this libcall is the entry node of the function.
2160   // Legalizing the call will automatically add the previous call to the
2161   // dependence.
2162   SDValue InChain = DAG.getEntryNode();
2163
2164   TargetLowering::ArgListTy Args;
2165   TargetLowering::ArgListEntry Entry;
2166   for (unsigned i = 0, e = Node->getNumOperands(); i != e; ++i) {
2167     EVT ArgVT = Node->getOperand(i).getValueType();
2168     const Type *ArgTy = ArgVT.getTypeForEVT(*DAG.getContext());
2169     Entry.Node = Node->getOperand(i); Entry.Ty = ArgTy;
2170     Entry.isSExt = isSigned;
2171     Entry.isZExt = !isSigned;
2172     Args.push_back(Entry);
2173   }
2174   SDValue Callee = DAG.getExternalSymbol(TLI.getLibcallName(LC),
2175                                          TLI.getPointerTy());
2176
2177   // Splice the libcall in wherever FindInputOutputChains tells us to.
2178   const Type *RetTy = Node->getValueType(0).getTypeForEVT(*DAG.getContext());
2179
2180   // isTailCall may be true since the callee does not reference caller stack
2181   // frame. Check if it's in the right position.
2182   bool isTailCall = isInTailCallPosition(DAG, Node, TLI);
2183   std::pair<SDValue, SDValue> CallInfo =
2184     TLI.LowerCallTo(InChain, RetTy, isSigned, !isSigned, false, false,
2185                     0, TLI.getLibcallCallingConv(LC), isTailCall,
2186                     /*isReturnValueUsed=*/true,
2187                     Callee, Args, DAG, Node->getDebugLoc());
2188
2189   if (!CallInfo.second.getNode())
2190     // It's a tailcall, return the chain (which is the DAG root).
2191     return DAG.getRoot();
2192
2193   // Legalize the call sequence, starting with the chain.  This will advance
2194   // the LastCALLSEQ to the legalized version of the CALLSEQ_END node that
2195   // was added by LowerCallTo (guaranteeing proper serialization of calls).
2196   LegalizeOp(CallInfo.second);
2197   return CallInfo.first;
2198 }
2199
2200 /// ExpandLibCall - Generate a libcall taking the given operands as arguments
2201 /// and returning a result of type RetVT.
2202 SDValue SelectionDAGLegalize::ExpandLibCall(RTLIB::Libcall LC, EVT RetVT,
2203                                             const SDValue *Ops, unsigned NumOps,
2204                                             bool isSigned, DebugLoc dl) {
2205   TargetLowering::ArgListTy Args;
2206   Args.reserve(NumOps);
2207
2208   TargetLowering::ArgListEntry Entry;
2209   for (unsigned i = 0; i != NumOps; ++i) {
2210     Entry.Node = Ops[i];
2211     Entry.Ty = Entry.Node.getValueType().getTypeForEVT(*DAG.getContext());
2212     Entry.isSExt = isSigned;
2213     Entry.isZExt = !isSigned;
2214     Args.push_back(Entry);
2215   }
2216   SDValue Callee = DAG.getExternalSymbol(TLI.getLibcallName(LC),
2217                                          TLI.getPointerTy());
2218
2219   const Type *RetTy = RetVT.getTypeForEVT(*DAG.getContext());
2220   std::pair<SDValue,SDValue> CallInfo =
2221   TLI.LowerCallTo(DAG.getEntryNode(), RetTy, isSigned, !isSigned, false,
2222                   false, 0, TLI.getLibcallCallingConv(LC), false,
2223                   /*isReturnValueUsed=*/true,
2224                   Callee, Args, DAG, dl);
2225
2226   // Legalize the call sequence, starting with the chain.  This will advance
2227   // the LastCALLSEQ_END to the legalized version of the CALLSEQ_END node that
2228   // was added by LowerCallTo (guaranteeing proper serialization of calls).
2229   LegalizeOp(CallInfo.second);
2230
2231   return CallInfo.first;
2232 }
2233
2234 // ExpandChainLibCall - Expand a node into a call to a libcall. Similar to
2235 // ExpandLibCall except that the first operand is the in-chain.
2236 std::pair<SDValue, SDValue>
2237 SelectionDAGLegalize::ExpandChainLibCall(RTLIB::Libcall LC,
2238                                          SDNode *Node,
2239                                          bool isSigned) {
2240   SDValue InChain = Node->getOperand(0);
2241
2242   TargetLowering::ArgListTy Args;
2243   TargetLowering::ArgListEntry Entry;
2244   for (unsigned i = 1, e = Node->getNumOperands(); i != e; ++i) {
2245     EVT ArgVT = Node->getOperand(i).getValueType();
2246     const Type *ArgTy = ArgVT.getTypeForEVT(*DAG.getContext());
2247     Entry.Node = Node->getOperand(i);
2248     Entry.Ty = ArgTy;
2249     Entry.isSExt = isSigned;
2250     Entry.isZExt = !isSigned;
2251     Args.push_back(Entry);
2252   }
2253   SDValue Callee = DAG.getExternalSymbol(TLI.getLibcallName(LC),
2254                                          TLI.getPointerTy());
2255
2256   // Splice the libcall in wherever FindInputOutputChains tells us to.
2257   const Type *RetTy = Node->getValueType(0).getTypeForEVT(*DAG.getContext());
2258   std::pair<SDValue, SDValue> CallInfo =
2259     TLI.LowerCallTo(InChain, RetTy, isSigned, !isSigned, false, false,
2260                     0, TLI.getLibcallCallingConv(LC), /*isTailCall=*/false,
2261                     /*isReturnValueUsed=*/true,
2262                     Callee, Args, DAG, Node->getDebugLoc());
2263
2264   // Legalize the call sequence, starting with the chain.  This will advance
2265   // the LastCALLSEQ to the legalized version of the CALLSEQ_END node that
2266   // was added by LowerCallTo (guaranteeing proper serialization of calls).
2267   LegalizeOp(CallInfo.second);
2268   return CallInfo;
2269 }
2270
2271 SDValue SelectionDAGLegalize::ExpandFPLibCall(SDNode* Node,
2272                                               RTLIB::Libcall Call_F32,
2273                                               RTLIB::Libcall Call_F64,
2274                                               RTLIB::Libcall Call_F80,
2275                                               RTLIB::Libcall Call_PPCF128) {
2276   RTLIB::Libcall LC;
2277   switch (Node->getValueType(0).getSimpleVT().SimpleTy) {
2278   default: assert(0 && "Unexpected request for libcall!");
2279   case MVT::f32: LC = Call_F32; break;
2280   case MVT::f64: LC = Call_F64; break;
2281   case MVT::f80: LC = Call_F80; break;
2282   case MVT::ppcf128: LC = Call_PPCF128; break;
2283   }
2284   return ExpandLibCall(LC, Node, false);
2285 }
2286
2287 SDValue SelectionDAGLegalize::ExpandIntLibCall(SDNode* Node, bool isSigned,
2288                                                RTLIB::Libcall Call_I8,
2289                                                RTLIB::Libcall Call_I16,
2290                                                RTLIB::Libcall Call_I32,
2291                                                RTLIB::Libcall Call_I64,
2292                                                RTLIB::Libcall Call_I128) {
2293   RTLIB::Libcall LC;
2294   switch (Node->getValueType(0).getSimpleVT().SimpleTy) {
2295   default: assert(0 && "Unexpected request for libcall!");
2296   case MVT::i8:   LC = Call_I8; break;
2297   case MVT::i16:  LC = Call_I16; break;
2298   case MVT::i32:  LC = Call_I32; break;
2299   case MVT::i64:  LC = Call_I64; break;
2300   case MVT::i128: LC = Call_I128; break;
2301   }
2302   return ExpandLibCall(LC, Node, isSigned);
2303 }
2304
2305 /// isDivRemLibcallAvailable - Return true if divmod libcall is available.
2306 static bool isDivRemLibcallAvailable(SDNode *Node, bool isSigned,
2307                                      const TargetLowering &TLI) {
2308   RTLIB::Libcall LC;
2309   switch (Node->getValueType(0).getSimpleVT().SimpleTy) {
2310   default: assert(0 && "Unexpected request for libcall!");
2311   case MVT::i8:   LC= isSigned ? RTLIB::SDIVREM_I8  : RTLIB::UDIVREM_I8;  break;
2312   case MVT::i16:  LC= isSigned ? RTLIB::SDIVREM_I16 : RTLIB::UDIVREM_I16; break;
2313   case MVT::i32:  LC= isSigned ? RTLIB::SDIVREM_I32 : RTLIB::UDIVREM_I32; break;
2314   case MVT::i64:  LC= isSigned ? RTLIB::SDIVREM_I64 : RTLIB::UDIVREM_I64; break;
2315   case MVT::i128: LC= isSigned ? RTLIB::SDIVREM_I128:RTLIB::UDIVREM_I128; break;
2316   }
2317
2318   return TLI.getLibcallName(LC) != 0;
2319 }
2320
2321 /// UseDivRem - Only issue divrem libcall if both quotient and remainder are
2322 /// needed.
2323 static bool UseDivRem(SDNode *Node, bool isSigned, bool isDIV) {
2324   unsigned OtherOpcode = 0;
2325   if (isSigned)
2326     OtherOpcode = isDIV ? ISD::SREM : ISD::SDIV;
2327   else
2328     OtherOpcode = isDIV ? ISD::UREM : ISD::UDIV;
2329
2330   SDValue Op0 = Node->getOperand(0);
2331   SDValue Op1 = Node->getOperand(1);
2332   for (SDNode::use_iterator UI = Op0.getNode()->use_begin(),
2333          UE = Op0.getNode()->use_end(); UI != UE; ++UI) {
2334     SDNode *User = *UI;
2335     if (User == Node)
2336       continue;
2337     if (User->getOpcode() == OtherOpcode &&
2338         User->getOperand(0) == Op0 &&
2339         User->getOperand(1) == Op1)
2340       return true;
2341   }
2342   return false;
2343 }
2344
2345 /// ExpandDivRemLibCall - Issue libcalls to __{u}divmod to compute div / rem
2346 /// pairs.
2347 void
2348 SelectionDAGLegalize::ExpandDivRemLibCall(SDNode *Node,
2349                                           SmallVectorImpl<SDValue> &Results) {
2350   unsigned Opcode = Node->getOpcode();
2351   bool isSigned = Opcode == ISD::SDIVREM;
2352
2353   RTLIB::Libcall LC;
2354   switch (Node->getValueType(0).getSimpleVT().SimpleTy) {
2355   default: assert(0 && "Unexpected request for libcall!");
2356   case MVT::i8:   LC= isSigned ? RTLIB::SDIVREM_I8  : RTLIB::UDIVREM_I8;  break;
2357   case MVT::i16:  LC= isSigned ? RTLIB::SDIVREM_I16 : RTLIB::UDIVREM_I16; break;
2358   case MVT::i32:  LC= isSigned ? RTLIB::SDIVREM_I32 : RTLIB::UDIVREM_I32; break;
2359   case MVT::i64:  LC= isSigned ? RTLIB::SDIVREM_I64 : RTLIB::UDIVREM_I64; break;
2360   case MVT::i128: LC= isSigned ? RTLIB::SDIVREM_I128:RTLIB::UDIVREM_I128; break;
2361   }
2362
2363   // The input chain to this libcall is the entry node of the function.
2364   // Legalizing the call will automatically add the previous call to the
2365   // dependence.
2366   SDValue InChain = DAG.getEntryNode();
2367
2368   EVT RetVT = Node->getValueType(0);
2369   const Type *RetTy = RetVT.getTypeForEVT(*DAG.getContext());
2370
2371   TargetLowering::ArgListTy Args;
2372   TargetLowering::ArgListEntry Entry;
2373   for (unsigned i = 0, e = Node->getNumOperands(); i != e; ++i) {
2374     EVT ArgVT = Node->getOperand(i).getValueType();
2375     const Type *ArgTy = ArgVT.getTypeForEVT(*DAG.getContext());
2376     Entry.Node = Node->getOperand(i); Entry.Ty = ArgTy;
2377     Entry.isSExt = isSigned;
2378     Entry.isZExt = !isSigned;
2379     Args.push_back(Entry);
2380   }
2381
2382   // Also pass the return address of the remainder.
2383   SDValue FIPtr = DAG.CreateStackTemporary(RetVT);
2384   Entry.Node = FIPtr;
2385   Entry.Ty = RetTy->getPointerTo();
2386   Entry.isSExt = isSigned;
2387   Entry.isZExt = !isSigned;
2388   Args.push_back(Entry);
2389
2390   SDValue Callee = DAG.getExternalSymbol(TLI.getLibcallName(LC),
2391                                          TLI.getPointerTy());
2392
2393   // Splice the libcall in wherever FindInputOutputChains tells us to.
2394   DebugLoc dl = Node->getDebugLoc();
2395   std::pair<SDValue, SDValue> CallInfo =
2396     TLI.LowerCallTo(InChain, RetTy, isSigned, !isSigned, false, false,
2397                     0, TLI.getLibcallCallingConv(LC), /*isTailCall=*/false,
2398                     /*isReturnValueUsed=*/true, Callee, Args, DAG, dl);
2399
2400   // Legalize the call sequence, starting with the chain.  This will advance
2401   // the LastCALLSEQ to the legalized version of the CALLSEQ_END node that
2402   // was added by LowerCallTo (guaranteeing proper serialization of calls).
2403   LegalizeOp(CallInfo.second);
2404
2405   // Remainder is loaded back from the stack frame.
2406   SDValue Rem = DAG.getLoad(RetVT, dl, getLastCALLSEQ(), FIPtr,
2407                             MachinePointerInfo(), false, false, 0);
2408   Results.push_back(CallInfo.first);
2409   Results.push_back(Rem);
2410 }
2411
2412 /// ExpandLegalINT_TO_FP - This function is responsible for legalizing a
2413 /// INT_TO_FP operation of the specified operand when the target requests that
2414 /// we expand it.  At this point, we know that the result and operand types are
2415 /// legal for the target.
2416 SDValue SelectionDAGLegalize::ExpandLegalINT_TO_FP(bool isSigned,
2417                                                    SDValue Op0,
2418                                                    EVT DestVT,
2419                                                    DebugLoc dl) {
2420   if (Op0.getValueType() == MVT::i32) {
2421     // simple 32-bit [signed|unsigned] integer to float/double expansion
2422
2423     // Get the stack frame index of a 8 byte buffer.
2424     SDValue StackSlot = DAG.CreateStackTemporary(MVT::f64);
2425
2426     // word offset constant for Hi/Lo address computation
2427     SDValue WordOff = DAG.getConstant(sizeof(int), TLI.getPointerTy());
2428     // set up Hi and Lo (into buffer) address based on endian
2429     SDValue Hi = StackSlot;
2430     SDValue Lo = DAG.getNode(ISD::ADD, dl,
2431                              TLI.getPointerTy(), StackSlot, WordOff);
2432     if (TLI.isLittleEndian())
2433       std::swap(Hi, Lo);
2434
2435     // if signed map to unsigned space
2436     SDValue Op0Mapped;
2437     if (isSigned) {
2438       // constant used to invert sign bit (signed to unsigned mapping)
2439       SDValue SignBit = DAG.getConstant(0x80000000u, MVT::i32);
2440       Op0Mapped = DAG.getNode(ISD::XOR, dl, MVT::i32, Op0, SignBit);
2441     } else {
2442       Op0Mapped = Op0;
2443     }
2444     // store the lo of the constructed double - based on integer input
2445     SDValue Store1 = DAG.getStore(DAG.getEntryNode(), dl,
2446                                   Op0Mapped, Lo, MachinePointerInfo(),
2447                                   false, false, 0);
2448     // initial hi portion of constructed double
2449     SDValue InitialHi = DAG.getConstant(0x43300000u, MVT::i32);
2450     // store the hi of the constructed double - biased exponent
2451     SDValue Store2 = DAG.getStore(Store1, dl, InitialHi, Hi,
2452                                   MachinePointerInfo(),
2453                                   false, false, 0);
2454     // load the constructed double
2455     SDValue Load = DAG.getLoad(MVT::f64, dl, Store2, StackSlot,
2456                                MachinePointerInfo(), false, false, 0);
2457     // FP constant to bias correct the final result
2458     SDValue Bias = DAG.getConstantFP(isSigned ?
2459                                      BitsToDouble(0x4330000080000000ULL) :
2460                                      BitsToDouble(0x4330000000000000ULL),
2461                                      MVT::f64);
2462     // subtract the bias
2463     SDValue Sub = DAG.getNode(ISD::FSUB, dl, MVT::f64, Load, Bias);
2464     // final result
2465     SDValue Result;
2466     // handle final rounding
2467     if (DestVT == MVT::f64) {
2468       // do nothing
2469       Result = Sub;
2470     } else if (DestVT.bitsLT(MVT::f64)) {
2471       Result = DAG.getNode(ISD::FP_ROUND, dl, DestVT, Sub,
2472                            DAG.getIntPtrConstant(0));
2473     } else if (DestVT.bitsGT(MVT::f64)) {
2474       Result = DAG.getNode(ISD::FP_EXTEND, dl, DestVT, Sub);
2475     }
2476     return Result;
2477   }
2478   assert(!isSigned && "Legalize cannot Expand SINT_TO_FP for i64 yet");
2479   // Code below here assumes !isSigned without checking again.
2480
2481   // Implementation of unsigned i64 to f64 following the algorithm in
2482   // __floatundidf in compiler_rt. This implementation has the advantage
2483   // of performing rounding correctly, both in the default rounding mode
2484   // and in all alternate rounding modes.
2485   // TODO: Generalize this for use with other types.
2486   if (Op0.getValueType() == MVT::i64 && DestVT == MVT::f64) {
2487     SDValue TwoP52 =
2488       DAG.getConstant(UINT64_C(0x4330000000000000), MVT::i64);
2489     SDValue TwoP84PlusTwoP52 =
2490       DAG.getConstantFP(BitsToDouble(UINT64_C(0x4530000000100000)), MVT::f64);
2491     SDValue TwoP84 =
2492       DAG.getConstant(UINT64_C(0x4530000000000000), MVT::i64);
2493
2494     SDValue Lo = DAG.getZeroExtendInReg(Op0, dl, MVT::i32);
2495     SDValue Hi = DAG.getNode(ISD::SRL, dl, MVT::i64, Op0,
2496                              DAG.getConstant(32, MVT::i64));
2497     SDValue LoOr = DAG.getNode(ISD::OR, dl, MVT::i64, Lo, TwoP52);
2498     SDValue HiOr = DAG.getNode(ISD::OR, dl, MVT::i64, Hi, TwoP84);
2499     SDValue LoFlt = DAG.getNode(ISD::BITCAST, dl, MVT::f64, LoOr);
2500     SDValue HiFlt = DAG.getNode(ISD::BITCAST, dl, MVT::f64, HiOr);
2501     SDValue HiSub = DAG.getNode(ISD::FSUB, dl, MVT::f64, HiFlt,
2502                                 TwoP84PlusTwoP52);
2503     return DAG.getNode(ISD::FADD, dl, MVT::f64, LoFlt, HiSub);
2504   }
2505
2506   // Implementation of unsigned i64 to f32.
2507   // TODO: Generalize this for use with other types.
2508   if (Op0.getValueType() == MVT::i64 && DestVT == MVT::f32) {
2509     // For unsigned conversions, convert them to signed conversions using the
2510     // algorithm from the x86_64 __floatundidf in compiler_rt.
2511     if (!isSigned) {
2512       SDValue Fast = DAG.getNode(ISD::SINT_TO_FP, dl, MVT::f32, Op0);
2513
2514       SDValue ShiftConst =
2515           DAG.getConstant(1, TLI.getShiftAmountTy(Op0.getValueType()));
2516       SDValue Shr = DAG.getNode(ISD::SRL, dl, MVT::i64, Op0, ShiftConst);
2517       SDValue AndConst = DAG.getConstant(1, MVT::i64);
2518       SDValue And = DAG.getNode(ISD::AND, dl, MVT::i64, Op0, AndConst);
2519       SDValue Or = DAG.getNode(ISD::OR, dl, MVT::i64, And, Shr);
2520
2521       SDValue SignCvt = DAG.getNode(ISD::SINT_TO_FP, dl, MVT::f32, Or);
2522       SDValue Slow = DAG.getNode(ISD::FADD, dl, MVT::f32, SignCvt, SignCvt);
2523
2524       // TODO: This really should be implemented using a branch rather than a
2525       // select.  We happen to get lucky and machinesink does the right
2526       // thing most of the time.  This would be a good candidate for a
2527       //pseudo-op, or, even better, for whole-function isel.
2528       SDValue SignBitTest = DAG.getSetCC(dl, TLI.getSetCCResultType(MVT::i64),
2529         Op0, DAG.getConstant(0, MVT::i64), ISD::SETLT);
2530       return DAG.getNode(ISD::SELECT, dl, MVT::f32, SignBitTest, Slow, Fast);
2531     }
2532
2533     // Otherwise, implement the fully general conversion.
2534
2535     SDValue And = DAG.getNode(ISD::AND, dl, MVT::i64, Op0,
2536          DAG.getConstant(UINT64_C(0xfffffffffffff800), MVT::i64));
2537     SDValue Or = DAG.getNode(ISD::OR, dl, MVT::i64, And,
2538          DAG.getConstant(UINT64_C(0x800), MVT::i64));
2539     SDValue And2 = DAG.getNode(ISD::AND, dl, MVT::i64, Op0,
2540          DAG.getConstant(UINT64_C(0x7ff), MVT::i64));
2541     SDValue Ne = DAG.getSetCC(dl, TLI.getSetCCResultType(MVT::i64),
2542                    And2, DAG.getConstant(UINT64_C(0), MVT::i64), ISD::SETNE);
2543     SDValue Sel = DAG.getNode(ISD::SELECT, dl, MVT::i64, Ne, Or, Op0);
2544     SDValue Ge = DAG.getSetCC(dl, TLI.getSetCCResultType(MVT::i64),
2545                    Op0, DAG.getConstant(UINT64_C(0x0020000000000000), MVT::i64),
2546                    ISD::SETUGE);
2547     SDValue Sel2 = DAG.getNode(ISD::SELECT, dl, MVT::i64, Ge, Sel, Op0);
2548     EVT SHVT = TLI.getShiftAmountTy(Sel2.getValueType());
2549
2550     SDValue Sh = DAG.getNode(ISD::SRL, dl, MVT::i64, Sel2,
2551                              DAG.getConstant(32, SHVT));
2552     SDValue Trunc = DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, Sh);
2553     SDValue Fcvt = DAG.getNode(ISD::UINT_TO_FP, dl, MVT::f64, Trunc);
2554     SDValue TwoP32 =
2555       DAG.getConstantFP(BitsToDouble(UINT64_C(0x41f0000000000000)), MVT::f64);
2556     SDValue Fmul = DAG.getNode(ISD::FMUL, dl, MVT::f64, TwoP32, Fcvt);
2557     SDValue Lo = DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, Sel2);
2558     SDValue Fcvt2 = DAG.getNode(ISD::UINT_TO_FP, dl, MVT::f64, Lo);
2559     SDValue Fadd = DAG.getNode(ISD::FADD, dl, MVT::f64, Fmul, Fcvt2);
2560     return DAG.getNode(ISD::FP_ROUND, dl, MVT::f32, Fadd,
2561                        DAG.getIntPtrConstant(0));
2562   }
2563
2564   SDValue Tmp1 = DAG.getNode(ISD::SINT_TO_FP, dl, DestVT, Op0);
2565
2566   SDValue SignSet = DAG.getSetCC(dl, TLI.getSetCCResultType(Op0.getValueType()),
2567                                  Op0, DAG.getConstant(0, Op0.getValueType()),
2568                                  ISD::SETLT);
2569   SDValue Zero = DAG.getIntPtrConstant(0), Four = DAG.getIntPtrConstant(4);
2570   SDValue CstOffset = DAG.getNode(ISD::SELECT, dl, Zero.getValueType(),
2571                                     SignSet, Four, Zero);
2572
2573   // If the sign bit of the integer is set, the large number will be treated
2574   // as a negative number.  To counteract this, the dynamic code adds an
2575   // offset depending on the data type.
2576   uint64_t FF;
2577   switch (Op0.getValueType().getSimpleVT().SimpleTy) {
2578   default: assert(0 && "Unsupported integer type!");
2579   case MVT::i8 : FF = 0x43800000ULL; break;  // 2^8  (as a float)
2580   case MVT::i16: FF = 0x47800000ULL; break;  // 2^16 (as a float)
2581   case MVT::i32: FF = 0x4F800000ULL; break;  // 2^32 (as a float)
2582   case MVT::i64: FF = 0x5F800000ULL; break;  // 2^64 (as a float)
2583   }
2584   if (TLI.isLittleEndian()) FF <<= 32;
2585   Constant *FudgeFactor = ConstantInt::get(
2586                                        Type::getInt64Ty(*DAG.getContext()), FF);
2587
2588   SDValue CPIdx = DAG.getConstantPool(FudgeFactor, TLI.getPointerTy());
2589   unsigned Alignment = cast<ConstantPoolSDNode>(CPIdx)->getAlignment();
2590   CPIdx = DAG.getNode(ISD::ADD, dl, TLI.getPointerTy(), CPIdx, CstOffset);
2591   Alignment = std::min(Alignment, 4u);
2592   SDValue FudgeInReg;
2593   if (DestVT == MVT::f32)
2594     FudgeInReg = DAG.getLoad(MVT::f32, dl, DAG.getEntryNode(), CPIdx,
2595                              MachinePointerInfo::getConstantPool(),
2596                              false, false, Alignment);
2597   else {
2598     FudgeInReg =
2599       LegalizeOp(DAG.getExtLoad(ISD::EXTLOAD, dl, DestVT,
2600                                 DAG.getEntryNode(), CPIdx,
2601                                 MachinePointerInfo::getConstantPool(),
2602                                 MVT::f32, false, false, Alignment));
2603   }
2604
2605   return DAG.getNode(ISD::FADD, dl, DestVT, Tmp1, FudgeInReg);
2606 }
2607
2608 /// PromoteLegalINT_TO_FP - This function is responsible for legalizing a
2609 /// *INT_TO_FP operation of the specified operand when the target requests that
2610 /// we promote it.  At this point, we know that the result and operand types are
2611 /// legal for the target, and that there is a legal UINT_TO_FP or SINT_TO_FP
2612 /// operation that takes a larger input.
2613 SDValue SelectionDAGLegalize::PromoteLegalINT_TO_FP(SDValue LegalOp,
2614                                                     EVT DestVT,
2615                                                     bool isSigned,
2616                                                     DebugLoc dl) {
2617   // First step, figure out the appropriate *INT_TO_FP operation to use.
2618   EVT NewInTy = LegalOp.getValueType();
2619
2620   unsigned OpToUse = 0;
2621
2622   // Scan for the appropriate larger type to use.
2623   while (1) {
2624     NewInTy = (MVT::SimpleValueType)(NewInTy.getSimpleVT().SimpleTy+1);
2625     assert(NewInTy.isInteger() && "Ran out of possibilities!");
2626
2627     // If the target supports SINT_TO_FP of this type, use it.
2628     if (TLI.isOperationLegalOrCustom(ISD::SINT_TO_FP, NewInTy)) {
2629       OpToUse = ISD::SINT_TO_FP;
2630       break;
2631     }
2632     if (isSigned) continue;
2633
2634     // If the target supports UINT_TO_FP of this type, use it.
2635     if (TLI.isOperationLegalOrCustom(ISD::UINT_TO_FP, NewInTy)) {
2636       OpToUse = ISD::UINT_TO_FP;
2637       break;
2638     }
2639
2640     // Otherwise, try a larger type.
2641   }
2642
2643   // Okay, we found the operation and type to use.  Zero extend our input to the
2644   // desired type then run the operation on it.
2645   return DAG.getNode(OpToUse, dl, DestVT,
2646                      DAG.getNode(isSigned ? ISD::SIGN_EXTEND : ISD::ZERO_EXTEND,
2647                                  dl, NewInTy, LegalOp));
2648 }
2649
2650 /// PromoteLegalFP_TO_INT - This function is responsible for legalizing a
2651 /// FP_TO_*INT operation of the specified operand when the target requests that
2652 /// we promote it.  At this point, we know that the result and operand types are
2653 /// legal for the target, and that there is a legal FP_TO_UINT or FP_TO_SINT
2654 /// operation that returns a larger result.
2655 SDValue SelectionDAGLegalize::PromoteLegalFP_TO_INT(SDValue LegalOp,
2656                                                     EVT DestVT,
2657                                                     bool isSigned,
2658                                                     DebugLoc dl) {
2659   // First step, figure out the appropriate FP_TO*INT operation to use.
2660   EVT NewOutTy = DestVT;
2661
2662   unsigned OpToUse = 0;
2663
2664   // Scan for the appropriate larger type to use.
2665   while (1) {
2666     NewOutTy = (MVT::SimpleValueType)(NewOutTy.getSimpleVT().SimpleTy+1);
2667     assert(NewOutTy.isInteger() && "Ran out of possibilities!");
2668
2669     if (TLI.isOperationLegalOrCustom(ISD::FP_TO_SINT, NewOutTy)) {
2670       OpToUse = ISD::FP_TO_SINT;
2671       break;
2672     }
2673
2674     if (TLI.isOperationLegalOrCustom(ISD::FP_TO_UINT, NewOutTy)) {
2675       OpToUse = ISD::FP_TO_UINT;
2676       break;
2677     }
2678
2679     // Otherwise, try a larger type.
2680   }
2681
2682
2683   // Okay, we found the operation and type to use.
2684   SDValue Operation = DAG.getNode(OpToUse, dl, NewOutTy, LegalOp);
2685
2686   // Truncate the result of the extended FP_TO_*INT operation to the desired
2687   // size.
2688   return DAG.getNode(ISD::TRUNCATE, dl, DestVT, Operation);
2689 }
2690
2691 /// ExpandBSWAP - Open code the operations for BSWAP of the specified operation.
2692 ///
2693 SDValue SelectionDAGLegalize::ExpandBSWAP(SDValue Op, DebugLoc dl) {
2694   EVT VT = Op.getValueType();
2695   EVT SHVT = TLI.getShiftAmountTy(VT);
2696   SDValue Tmp1, Tmp2, Tmp3, Tmp4, Tmp5, Tmp6, Tmp7, Tmp8;
2697   switch (VT.getSimpleVT().SimpleTy) {
2698   default: assert(0 && "Unhandled Expand type in BSWAP!");
2699   case MVT::i16:
2700     Tmp2 = DAG.getNode(ISD::SHL, dl, VT, Op, DAG.getConstant(8, SHVT));
2701     Tmp1 = DAG.getNode(ISD::SRL, dl, VT, Op, DAG.getConstant(8, SHVT));
2702     return DAG.getNode(ISD::OR, dl, VT, Tmp1, Tmp2);
2703   case MVT::i32:
2704     Tmp4 = DAG.getNode(ISD::SHL, dl, VT, Op, DAG.getConstant(24, SHVT));
2705     Tmp3 = DAG.getNode(ISD::SHL, dl, VT, Op, DAG.getConstant(8, SHVT));
2706     Tmp2 = DAG.getNode(ISD::SRL, dl, VT, Op, DAG.getConstant(8, SHVT));
2707     Tmp1 = DAG.getNode(ISD::SRL, dl, VT, Op, DAG.getConstant(24, SHVT));
2708     Tmp3 = DAG.getNode(ISD::AND, dl, VT, Tmp3, DAG.getConstant(0xFF0000, VT));
2709     Tmp2 = DAG.getNode(ISD::AND, dl, VT, Tmp2, DAG.getConstant(0xFF00, VT));
2710     Tmp4 = DAG.getNode(ISD::OR, dl, VT, Tmp4, Tmp3);
2711     Tmp2 = DAG.getNode(ISD::OR, dl, VT, Tmp2, Tmp1);
2712     return DAG.getNode(ISD::OR, dl, VT, Tmp4, Tmp2);
2713   case MVT::i64:
2714     Tmp8 = DAG.getNode(ISD::SHL, dl, VT, Op, DAG.getConstant(56, SHVT));
2715     Tmp7 = DAG.getNode(ISD::SHL, dl, VT, Op, DAG.getConstant(40, SHVT));
2716     Tmp6 = DAG.getNode(ISD::SHL, dl, VT, Op, DAG.getConstant(24, SHVT));
2717     Tmp5 = DAG.getNode(ISD::SHL, dl, VT, Op, DAG.getConstant(8, SHVT));
2718     Tmp4 = DAG.getNode(ISD::SRL, dl, VT, Op, DAG.getConstant(8, SHVT));
2719     Tmp3 = DAG.getNode(ISD::SRL, dl, VT, Op, DAG.getConstant(24, SHVT));
2720     Tmp2 = DAG.getNode(ISD::SRL, dl, VT, Op, DAG.getConstant(40, SHVT));
2721     Tmp1 = DAG.getNode(ISD::SRL, dl, VT, Op, DAG.getConstant(56, SHVT));
2722     Tmp7 = DAG.getNode(ISD::AND, dl, VT, Tmp7, DAG.getConstant(255ULL<<48, VT));
2723     Tmp6 = DAG.getNode(ISD::AND, dl, VT, Tmp6, DAG.getConstant(255ULL<<40, VT));
2724     Tmp5 = DAG.getNode(ISD::AND, dl, VT, Tmp5, DAG.getConstant(255ULL<<32, VT));
2725     Tmp4 = DAG.getNode(ISD::AND, dl, VT, Tmp4, DAG.getConstant(255ULL<<24, VT));
2726     Tmp3 = DAG.getNode(ISD::AND, dl, VT, Tmp3, DAG.getConstant(255ULL<<16, VT));
2727     Tmp2 = DAG.getNode(ISD::AND, dl, VT, Tmp2, DAG.getConstant(255ULL<<8 , VT));
2728     Tmp8 = DAG.getNode(ISD::OR, dl, VT, Tmp8, Tmp7);
2729     Tmp6 = DAG.getNode(ISD::OR, dl, VT, Tmp6, Tmp5);
2730     Tmp4 = DAG.getNode(ISD::OR, dl, VT, Tmp4, Tmp3);
2731     Tmp2 = DAG.getNode(ISD::OR, dl, VT, Tmp2, Tmp1);
2732     Tmp8 = DAG.getNode(ISD::OR, dl, VT, Tmp8, Tmp6);
2733     Tmp4 = DAG.getNode(ISD::OR, dl, VT, Tmp4, Tmp2);
2734     return DAG.getNode(ISD::OR, dl, VT, Tmp8, Tmp4);
2735   }
2736 }
2737
2738 /// SplatByte - Distribute ByteVal over NumBits bits.
2739 // FIXME: Move this helper to a common place.
2740 static APInt SplatByte(unsigned NumBits, uint8_t ByteVal) {
2741   APInt Val = APInt(NumBits, ByteVal);
2742   unsigned Shift = 8;
2743   for (unsigned i = NumBits; i > 8; i >>= 1) {
2744     Val = (Val << Shift) | Val;
2745     Shift <<= 1;
2746   }
2747   return Val;
2748 }
2749
2750 /// ExpandBitCount - Expand the specified bitcount instruction into operations.
2751 ///
2752 SDValue SelectionDAGLegalize::ExpandBitCount(unsigned Opc, SDValue Op,
2753                                              DebugLoc dl) {
2754   switch (Opc) {
2755   default: assert(0 && "Cannot expand this yet!");
2756   case ISD::CTPOP: {
2757     EVT VT = Op.getValueType();
2758     EVT ShVT = TLI.getShiftAmountTy(VT);
2759     unsigned Len = VT.getSizeInBits();
2760
2761     assert(VT.isInteger() && Len <= 128 && Len % 8 == 0 &&
2762            "CTPOP not implemented for this type.");
2763
2764     // This is the "best" algorithm from
2765     // http://graphics.stanford.edu/~seander/bithacks.html#CountBitsSetParallel
2766
2767     SDValue Mask55 = DAG.getConstant(SplatByte(Len, 0x55), VT);
2768     SDValue Mask33 = DAG.getConstant(SplatByte(Len, 0x33), VT);
2769     SDValue Mask0F = DAG.getConstant(SplatByte(Len, 0x0F), VT);
2770     SDValue Mask01 = DAG.getConstant(SplatByte(Len, 0x01), VT);
2771
2772     // v = v - ((v >> 1) & 0x55555555...)
2773     Op = DAG.getNode(ISD::SUB, dl, VT, Op,
2774                      DAG.getNode(ISD::AND, dl, VT,
2775                                  DAG.getNode(ISD::SRL, dl, VT, Op,
2776                                              DAG.getConstant(1, ShVT)),
2777                                  Mask55));
2778     // v = (v & 0x33333333...) + ((v >> 2) & 0x33333333...)
2779     Op = DAG.getNode(ISD::ADD, dl, VT,
2780                      DAG.getNode(ISD::AND, dl, VT, Op, Mask33),
2781                      DAG.getNode(ISD::AND, dl, VT,
2782                                  DAG.getNode(ISD::SRL, dl, VT, Op,
2783                                              DAG.getConstant(2, ShVT)),
2784                                  Mask33));
2785     // v = (v + (v >> 4)) & 0x0F0F0F0F...
2786     Op = DAG.getNode(ISD::AND, dl, VT,
2787                      DAG.getNode(ISD::ADD, dl, VT, Op,
2788                                  DAG.getNode(ISD::SRL, dl, VT, Op,
2789                                              DAG.getConstant(4, ShVT))),
2790                      Mask0F);
2791     // v = (v * 0x01010101...) >> (Len - 8)
2792     Op = DAG.getNode(ISD::SRL, dl, VT,
2793                      DAG.getNode(ISD::MUL, dl, VT, Op, Mask01),
2794                      DAG.getConstant(Len - 8, ShVT));
2795
2796     return Op;
2797   }
2798   case ISD::CTLZ: {
2799     // for now, we do this:
2800     // x = x | (x >> 1);
2801     // x = x | (x >> 2);
2802     // ...
2803     // x = x | (x >>16);
2804     // x = x | (x >>32); // for 64-bit input
2805     // return popcount(~x);
2806     //
2807     // but see also: http://www.hackersdelight.org/HDcode/nlz.cc
2808     EVT VT = Op.getValueType();
2809     EVT ShVT = TLI.getShiftAmountTy(VT);
2810     unsigned len = VT.getSizeInBits();
2811     for (unsigned i = 0; (1U << i) <= (len / 2); ++i) {
2812       SDValue Tmp3 = DAG.getConstant(1ULL << i, ShVT);
2813       Op = DAG.getNode(ISD::OR, dl, VT, Op,
2814                        DAG.getNode(ISD::SRL, dl, VT, Op, Tmp3));
2815     }
2816     Op = DAG.getNOT(dl, Op, VT);
2817     return DAG.getNode(ISD::CTPOP, dl, VT, Op);
2818   }
2819   case ISD::CTTZ: {
2820     // for now, we use: { return popcount(~x & (x - 1)); }
2821     // unless the target has ctlz but not ctpop, in which case we use:
2822     // { return 32 - nlz(~x & (x-1)); }
2823     // see also http://www.hackersdelight.org/HDcode/ntz.cc
2824     EVT VT = Op.getValueType();
2825     SDValue Tmp3 = DAG.getNode(ISD::AND, dl, VT,
2826                                DAG.getNOT(dl, Op, VT),
2827                                DAG.getNode(ISD::SUB, dl, VT, Op,
2828                                            DAG.getConstant(1, VT)));
2829     // If ISD::CTLZ is legal and CTPOP isn't, then do that instead.
2830     if (!TLI.isOperationLegalOrCustom(ISD::CTPOP, VT) &&
2831         TLI.isOperationLegalOrCustom(ISD::CTLZ, VT))
2832       return DAG.getNode(ISD::SUB, dl, VT,
2833                          DAG.getConstant(VT.getSizeInBits(), VT),
2834                          DAG.getNode(ISD::CTLZ, dl, VT, Tmp3));
2835     return DAG.getNode(ISD::CTPOP, dl, VT, Tmp3);
2836   }
2837   }
2838 }
2839
2840 std::pair <SDValue, SDValue> SelectionDAGLegalize::ExpandAtomic(SDNode *Node) {
2841   unsigned Opc = Node->getOpcode();
2842   MVT VT = cast<AtomicSDNode>(Node)->getMemoryVT().getSimpleVT();
2843   RTLIB::Libcall LC;
2844
2845   switch (Opc) {
2846   default:
2847     llvm_unreachable("Unhandled atomic intrinsic Expand!");
2848     break;
2849   case ISD::ATOMIC_SWAP:
2850     switch (VT.SimpleTy) {
2851     default: llvm_unreachable("Unexpected value type for atomic!");
2852     case MVT::i8:  LC = RTLIB::SYNC_LOCK_TEST_AND_SET_1; break;
2853     case MVT::i16: LC = RTLIB::SYNC_LOCK_TEST_AND_SET_2; break;
2854     case MVT::i32: LC = RTLIB::SYNC_LOCK_TEST_AND_SET_4; break;
2855     case MVT::i64: LC = RTLIB::SYNC_LOCK_TEST_AND_SET_8; break;
2856     }
2857     break;
2858   case ISD::ATOMIC_CMP_SWAP:
2859     switch (VT.SimpleTy) {
2860     default: llvm_unreachable("Unexpected value type for atomic!");
2861     case MVT::i8:  LC = RTLIB::SYNC_VAL_COMPARE_AND_SWAP_1; break;
2862     case MVT::i16: LC = RTLIB::SYNC_VAL_COMPARE_AND_SWAP_2; break;
2863     case MVT::i32: LC = RTLIB::SYNC_VAL_COMPARE_AND_SWAP_4; break;
2864     case MVT::i64: LC = RTLIB::SYNC_VAL_COMPARE_AND_SWAP_8; break;
2865     }
2866     break;
2867   case ISD::ATOMIC_LOAD_ADD:
2868     switch (VT.SimpleTy) {
2869     default: llvm_unreachable("Unexpected value type for atomic!");
2870     case MVT::i8:  LC = RTLIB::SYNC_FETCH_AND_ADD_1; break;
2871     case MVT::i16: LC = RTLIB::SYNC_FETCH_AND_ADD_2; break;
2872     case MVT::i32: LC = RTLIB::SYNC_FETCH_AND_ADD_4; break;
2873     case MVT::i64: LC = RTLIB::SYNC_FETCH_AND_ADD_8; break;
2874     }
2875     break;
2876   case ISD::ATOMIC_LOAD_SUB:
2877     switch (VT.SimpleTy) {
2878     default: llvm_unreachable("Unexpected value type for atomic!");
2879     case MVT::i8:  LC = RTLIB::SYNC_FETCH_AND_SUB_1; break;
2880     case MVT::i16: LC = RTLIB::SYNC_FETCH_AND_SUB_2; break;
2881     case MVT::i32: LC = RTLIB::SYNC_FETCH_AND_SUB_4; break;
2882     case MVT::i64: LC = RTLIB::SYNC_FETCH_AND_SUB_8; break;
2883     }
2884     break;
2885   case ISD::ATOMIC_LOAD_AND:
2886     switch (VT.SimpleTy) {
2887     default: llvm_unreachable("Unexpected value type for atomic!");
2888     case MVT::i8:  LC = RTLIB::SYNC_FETCH_AND_AND_1; break;
2889     case MVT::i16: LC = RTLIB::SYNC_FETCH_AND_AND_2; break;
2890     case MVT::i32: LC = RTLIB::SYNC_FETCH_AND_AND_4; break;
2891     case MVT::i64: LC = RTLIB::SYNC_FETCH_AND_AND_8; break;
2892     }
2893     break;
2894   case ISD::ATOMIC_LOAD_OR:
2895     switch (VT.SimpleTy) {
2896     default: llvm_unreachable("Unexpected value type for atomic!");
2897     case MVT::i8:  LC = RTLIB::SYNC_FETCH_AND_OR_1; break;
2898     case MVT::i16: LC = RTLIB::SYNC_FETCH_AND_OR_2; break;
2899     case MVT::i32: LC = RTLIB::SYNC_FETCH_AND_OR_4; break;
2900     case MVT::i64: LC = RTLIB::SYNC_FETCH_AND_OR_8; break;
2901     }
2902     break;
2903   case ISD::ATOMIC_LOAD_XOR:
2904     switch (VT.SimpleTy) {
2905     default: llvm_unreachable("Unexpected value type for atomic!");
2906     case MVT::i8:  LC = RTLIB::SYNC_FETCH_AND_XOR_1; break;
2907     case MVT::i16: LC = RTLIB::SYNC_FETCH_AND_XOR_2; break;
2908     case MVT::i32: LC = RTLIB::SYNC_FETCH_AND_XOR_4; break;
2909     case MVT::i64: LC = RTLIB::SYNC_FETCH_AND_XOR_8; break;
2910     }
2911     break;
2912   case ISD::ATOMIC_LOAD_NAND:
2913     switch (VT.SimpleTy) {
2914     default: llvm_unreachable("Unexpected value type for atomic!");
2915     case MVT::i8:  LC = RTLIB::SYNC_FETCH_AND_NAND_1; break;
2916     case MVT::i16: LC = RTLIB::SYNC_FETCH_AND_NAND_2; break;
2917     case MVT::i32: LC = RTLIB::SYNC_FETCH_AND_NAND_4; break;
2918     case MVT::i64: LC = RTLIB::SYNC_FETCH_AND_NAND_8; break;
2919     }
2920     break;
2921   }
2922
2923   return ExpandChainLibCall(LC, Node, false);
2924 }
2925
2926 void SelectionDAGLegalize::ExpandNode(SDNode *Node,
2927                                       SmallVectorImpl<SDValue> &Results) {
2928   DebugLoc dl = Node->getDebugLoc();
2929   SDValue Tmp1, Tmp2, Tmp3, Tmp4;
2930   switch (Node->getOpcode()) {
2931   case ISD::CTPOP:
2932   case ISD::CTLZ:
2933   case ISD::CTTZ:
2934     Tmp1 = ExpandBitCount(Node->getOpcode(), Node->getOperand(0), dl);
2935     Results.push_back(Tmp1);
2936     break;
2937   case ISD::BSWAP:
2938     Results.push_back(ExpandBSWAP(Node->getOperand(0), dl));
2939     break;
2940   case ISD::FRAMEADDR:
2941   case ISD::RETURNADDR:
2942   case ISD::FRAME_TO_ARGS_OFFSET:
2943     Results.push_back(DAG.getConstant(0, Node->getValueType(0)));
2944     break;
2945   case ISD::FLT_ROUNDS_:
2946     Results.push_back(DAG.getConstant(1, Node->getValueType(0)));
2947     break;
2948   case ISD::EH_RETURN:
2949   case ISD::EH_LABEL:
2950   case ISD::PREFETCH:
2951   case ISD::VAEND:
2952   case ISD::EH_SJLJ_LONGJMP:
2953   case ISD::EH_SJLJ_DISPATCHSETUP:
2954     // If the target didn't expand these, there's nothing to do, so just
2955     // preserve the chain and be done.
2956     Results.push_back(Node->getOperand(0));
2957     break;
2958   case ISD::EH_SJLJ_SETJMP:
2959     // If the target didn't expand this, just return 'zero' and preserve the
2960     // chain.
2961     Results.push_back(DAG.getConstant(0, MVT::i32));
2962     Results.push_back(Node->getOperand(0));
2963     break;
2964   case ISD::MEMBARRIER: {
2965     // If the target didn't lower this, lower it to '__sync_synchronize()' call
2966     TargetLowering::ArgListTy Args;
2967     std::pair<SDValue, SDValue> CallResult =
2968       TLI.LowerCallTo(Node->getOperand(0), Type::getVoidTy(*DAG.getContext()),
2969                       false, false, false, false, 0, CallingConv::C,
2970                       /*isTailCall=*/false,
2971                       /*isReturnValueUsed=*/true,
2972                       DAG.getExternalSymbol("__sync_synchronize",
2973                                             TLI.getPointerTy()),
2974                       Args, DAG, dl);
2975     Results.push_back(CallResult.second);
2976     break;
2977   }
2978   // By default, atomic intrinsics are marked Legal and lowered. Targets
2979   // which don't support them directly, however, may want libcalls, in which
2980   // case they mark them Expand, and we get here.
2981   case ISD::ATOMIC_SWAP:
2982   case ISD::ATOMIC_LOAD_ADD:
2983   case ISD::ATOMIC_LOAD_SUB:
2984   case ISD::ATOMIC_LOAD_AND:
2985   case ISD::ATOMIC_LOAD_OR:
2986   case ISD::ATOMIC_LOAD_XOR:
2987   case ISD::ATOMIC_LOAD_NAND:
2988   case ISD::ATOMIC_LOAD_MIN:
2989   case ISD::ATOMIC_LOAD_MAX:
2990   case ISD::ATOMIC_LOAD_UMIN:
2991   case ISD::ATOMIC_LOAD_UMAX:
2992   case ISD::ATOMIC_CMP_SWAP: {
2993     std::pair<SDValue, SDValue> Tmp = ExpandAtomic(Node);
2994     Results.push_back(Tmp.first);
2995     Results.push_back(Tmp.second);
2996     break;
2997   }
2998   case ISD::DYNAMIC_STACKALLOC:
2999     ExpandDYNAMIC_STACKALLOC(Node, Results);
3000     break;
3001   case ISD::MERGE_VALUES:
3002     for (unsigned i = 0; i < Node->getNumValues(); i++)
3003       Results.push_back(Node->getOperand(i));
3004     break;
3005   case ISD::UNDEF: {
3006     EVT VT = Node->getValueType(0);
3007     if (VT.isInteger())
3008       Results.push_back(DAG.getConstant(0, VT));
3009     else {
3010       assert(VT.isFloatingPoint() && "Unknown value type!");
3011       Results.push_back(DAG.getConstantFP(0, VT));
3012     }
3013     break;
3014   }
3015   case ISD::TRAP: {
3016     // If this operation is not supported, lower it to 'abort()' call
3017     TargetLowering::ArgListTy Args;
3018     std::pair<SDValue, SDValue> CallResult =
3019       TLI.LowerCallTo(Node->getOperand(0), Type::getVoidTy(*DAG.getContext()),
3020                       false, false, false, false, 0, CallingConv::C,
3021                       /*isTailCall=*/false,
3022                       /*isReturnValueUsed=*/true,
3023                       DAG.getExternalSymbol("abort", TLI.getPointerTy()),
3024                       Args, DAG, dl);
3025     Results.push_back(CallResult.second);
3026     break;
3027   }
3028   case ISD::FP_ROUND:
3029   case ISD::BITCAST:
3030     Tmp1 = EmitStackConvert(Node->getOperand(0), Node->getValueType(0),
3031                             Node->getValueType(0), dl);
3032     Results.push_back(Tmp1);
3033     break;
3034   case ISD::FP_EXTEND:
3035     Tmp1 = EmitStackConvert(Node->getOperand(0),
3036                             Node->getOperand(0).getValueType(),
3037                             Node->getValueType(0), dl);
3038     Results.push_back(Tmp1);
3039     break;
3040   case ISD::SIGN_EXTEND_INREG: {
3041     // NOTE: we could fall back on load/store here too for targets without
3042     // SAR.  However, it is doubtful that any exist.
3043     EVT ExtraVT = cast<VTSDNode>(Node->getOperand(1))->getVT();
3044     EVT VT = Node->getValueType(0);
3045     EVT ShiftAmountTy = TLI.getShiftAmountTy(VT);
3046     if (VT.isVector())
3047       ShiftAmountTy = VT;
3048     unsigned BitsDiff = VT.getScalarType().getSizeInBits() -
3049                         ExtraVT.getScalarType().getSizeInBits();
3050     SDValue ShiftCst = DAG.getConstant(BitsDiff, ShiftAmountTy);
3051     Tmp1 = DAG.getNode(ISD::SHL, dl, Node->getValueType(0),
3052                        Node->getOperand(0), ShiftCst);
3053     Tmp1 = DAG.getNode(ISD::SRA, dl, Node->getValueType(0), Tmp1, ShiftCst);
3054     Results.push_back(Tmp1);
3055     break;
3056   }
3057   case ISD::FP_ROUND_INREG: {
3058     // The only way we can lower this is to turn it into a TRUNCSTORE,
3059     // EXTLOAD pair, targeting a temporary location (a stack slot).
3060
3061     // NOTE: there is a choice here between constantly creating new stack
3062     // slots and always reusing the same one.  We currently always create
3063     // new ones, as reuse may inhibit scheduling.
3064     EVT ExtraVT = cast<VTSDNode>(Node->getOperand(1))->getVT();
3065     Tmp1 = EmitStackConvert(Node->getOperand(0), ExtraVT,
3066                             Node->getValueType(0), dl);
3067     Results.push_back(Tmp1);
3068     break;
3069   }
3070   case ISD::SINT_TO_FP:
3071   case ISD::UINT_TO_FP:
3072     Tmp1 = ExpandLegalINT_TO_FP(Node->getOpcode() == ISD::SINT_TO_FP,
3073                                 Node->getOperand(0), Node->getValueType(0), dl);
3074     Results.push_back(Tmp1);
3075     break;
3076   case ISD::FP_TO_UINT: {
3077     SDValue True, False;
3078     EVT VT =  Node->getOperand(0).getValueType();
3079     EVT NVT = Node->getValueType(0);
3080     APFloat apf(APInt::getNullValue(VT.getSizeInBits()));
3081     APInt x = APInt::getSignBit(NVT.getSizeInBits());
3082     (void)apf.convertFromAPInt(x, false, APFloat::rmNearestTiesToEven);
3083     Tmp1 = DAG.getConstantFP(apf, VT);
3084     Tmp2 = DAG.getSetCC(dl, TLI.getSetCCResultType(VT),
3085                         Node->getOperand(0),
3086                         Tmp1, ISD::SETLT);
3087     True = DAG.getNode(ISD::FP_TO_SINT, dl, NVT, Node->getOperand(0));
3088     False = DAG.getNode(ISD::FP_TO_SINT, dl, NVT,
3089                         DAG.getNode(ISD::FSUB, dl, VT,
3090                                     Node->getOperand(0), Tmp1));
3091     False = DAG.getNode(ISD::XOR, dl, NVT, False,
3092                         DAG.getConstant(x, NVT));
3093     Tmp1 = DAG.getNode(ISD::SELECT, dl, NVT, Tmp2, True, False);
3094     Results.push_back(Tmp1);
3095     break;
3096   }
3097   case ISD::VAARG: {
3098     const Value *V = cast<SrcValueSDNode>(Node->getOperand(2))->getValue();
3099     EVT VT = Node->getValueType(0);
3100     Tmp1 = Node->getOperand(0);
3101     Tmp2 = Node->getOperand(1);
3102     unsigned Align = Node->getConstantOperandVal(3);
3103
3104     SDValue VAListLoad = DAG.getLoad(TLI.getPointerTy(), dl, Tmp1, Tmp2,
3105                                      MachinePointerInfo(V), false, false, 0);
3106     SDValue VAList = VAListLoad;
3107
3108     if (Align > TLI.getMinStackArgumentAlignment()) {
3109       assert(((Align & (Align-1)) == 0) && "Expected Align to be a power of 2");
3110
3111       VAList = DAG.getNode(ISD::ADD, dl, TLI.getPointerTy(), VAList,
3112                            DAG.getConstant(Align - 1,
3113                                            TLI.getPointerTy()));
3114
3115       VAList = DAG.getNode(ISD::AND, dl, TLI.getPointerTy(), VAList,
3116                            DAG.getConstant(-(int64_t)Align,
3117                                            TLI.getPointerTy()));
3118     }
3119
3120     // Increment the pointer, VAList, to the next vaarg
3121     Tmp3 = DAG.getNode(ISD::ADD, dl, TLI.getPointerTy(), VAList,
3122                        DAG.getConstant(TLI.getTargetData()->
3123                           getTypeAllocSize(VT.getTypeForEVT(*DAG.getContext())),
3124                                        TLI.getPointerTy()));
3125     // Store the incremented VAList to the legalized pointer
3126     Tmp3 = DAG.getStore(VAListLoad.getValue(1), dl, Tmp3, Tmp2,
3127                         MachinePointerInfo(V), false, false, 0);
3128     // Load the actual argument out of the pointer VAList
3129     Results.push_back(DAG.getLoad(VT, dl, Tmp3, VAList, MachinePointerInfo(),
3130                                   false, false, 0));
3131     Results.push_back(Results[0].getValue(1));
3132     break;
3133   }
3134   case ISD::VACOPY: {
3135     // This defaults to loading a pointer from the input and storing it to the
3136     // output, returning the chain.
3137     const Value *VD = cast<SrcValueSDNode>(Node->getOperand(3))->getValue();
3138     const Value *VS = cast<SrcValueSDNode>(Node->getOperand(4))->getValue();
3139     Tmp1 = DAG.getLoad(TLI.getPointerTy(), dl, Node->getOperand(0),
3140                        Node->getOperand(2), MachinePointerInfo(VS),
3141                        false, false, 0);
3142     Tmp1 = DAG.getStore(Tmp1.getValue(1), dl, Tmp1, Node->getOperand(1),
3143                         MachinePointerInfo(VD), false, false, 0);
3144     Results.push_back(Tmp1);
3145     break;
3146   }
3147   case ISD::EXTRACT_VECTOR_ELT:
3148     if (Node->getOperand(0).getValueType().getVectorNumElements() == 1)
3149       // This must be an access of the only element.  Return it.
3150       Tmp1 = DAG.getNode(ISD::BITCAST, dl, Node->getValueType(0),
3151                          Node->getOperand(0));
3152     else
3153       Tmp1 = ExpandExtractFromVectorThroughStack(SDValue(Node, 0));
3154     Results.push_back(Tmp1);
3155     break;
3156   case ISD::EXTRACT_SUBVECTOR:
3157     Results.push_back(ExpandExtractFromVectorThroughStack(SDValue(Node, 0)));
3158     break;
3159   case ISD::INSERT_SUBVECTOR:
3160     Results.push_back(ExpandInsertToVectorThroughStack(SDValue(Node, 0)));
3161     break;
3162   case ISD::CONCAT_VECTORS: {
3163     Results.push_back(ExpandVectorBuildThroughStack(Node));
3164     break;
3165   }
3166   case ISD::SCALAR_TO_VECTOR:
3167     Results.push_back(ExpandSCALAR_TO_VECTOR(Node));
3168     break;
3169   case ISD::INSERT_VECTOR_ELT:
3170     Results.push_back(ExpandINSERT_VECTOR_ELT(Node->getOperand(0),
3171                                               Node->getOperand(1),
3172                                               Node->getOperand(2), dl));
3173     break;
3174   case ISD::VECTOR_SHUFFLE: {
3175     SmallVector<int, 8> Mask;
3176     cast<ShuffleVectorSDNode>(Node)->getMask(Mask);
3177
3178     EVT VT = Node->getValueType(0);
3179     EVT EltVT = VT.getVectorElementType();
3180     if (!TLI.isTypeLegal(EltVT))
3181       EltVT = TLI.getTypeToTransformTo(*DAG.getContext(), EltVT);
3182     unsigned NumElems = VT.getVectorNumElements();
3183     SmallVector<SDValue, 8> Ops;
3184     for (unsigned i = 0; i != NumElems; ++i) {
3185       if (Mask[i] < 0) {
3186         Ops.push_back(DAG.getUNDEF(EltVT));
3187         continue;
3188       }
3189       unsigned Idx = Mask[i];
3190       if (Idx < NumElems)
3191         Ops.push_back(DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, EltVT,
3192                                   Node->getOperand(0),
3193                                   DAG.getIntPtrConstant(Idx)));
3194       else
3195         Ops.push_back(DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, EltVT,
3196                                   Node->getOperand(1),
3197                                   DAG.getIntPtrConstant(Idx - NumElems)));
3198     }
3199     Tmp1 = DAG.getNode(ISD::BUILD_VECTOR, dl, VT, &Ops[0], Ops.size());
3200     Results.push_back(Tmp1);
3201     break;
3202   }
3203   case ISD::EXTRACT_ELEMENT: {
3204     EVT OpTy = Node->getOperand(0).getValueType();
3205     if (cast<ConstantSDNode>(Node->getOperand(1))->getZExtValue()) {
3206       // 1 -> Hi
3207       Tmp1 = DAG.getNode(ISD::SRL, dl, OpTy, Node->getOperand(0),
3208                          DAG.getConstant(OpTy.getSizeInBits()/2,
3209                     TLI.getShiftAmountTy(Node->getOperand(0).getValueType())));
3210       Tmp1 = DAG.getNode(ISD::TRUNCATE, dl, Node->getValueType(0), Tmp1);
3211     } else {
3212       // 0 -> Lo
3213       Tmp1 = DAG.getNode(ISD::TRUNCATE, dl, Node->getValueType(0),
3214                          Node->getOperand(0));
3215     }
3216     Results.push_back(Tmp1);
3217     break;
3218   }
3219   case ISD::STACKSAVE:
3220     // Expand to CopyFromReg if the target set
3221     // StackPointerRegisterToSaveRestore.
3222     if (unsigned SP = TLI.getStackPointerRegisterToSaveRestore()) {
3223       Results.push_back(DAG.getCopyFromReg(Node->getOperand(0), dl, SP,
3224                                            Node->getValueType(0)));
3225       Results.push_back(Results[0].getValue(1));
3226     } else {
3227       Results.push_back(DAG.getUNDEF(Node->getValueType(0)));
3228       Results.push_back(Node->getOperand(0));
3229     }
3230     break;
3231   case ISD::STACKRESTORE:
3232     // Expand to CopyToReg if the target set
3233     // StackPointerRegisterToSaveRestore.
3234     if (unsigned SP = TLI.getStackPointerRegisterToSaveRestore()) {
3235       Results.push_back(DAG.getCopyToReg(Node->getOperand(0), dl, SP,
3236                                          Node->getOperand(1)));
3237     } else {
3238       Results.push_back(Node->getOperand(0));
3239     }
3240     break;
3241   case ISD::FCOPYSIGN:
3242     Results.push_back(ExpandFCOPYSIGN(Node));
3243     break;
3244   case ISD::FNEG:
3245     // Expand Y = FNEG(X) ->  Y = SUB -0.0, X
3246     Tmp1 = DAG.getConstantFP(-0.0, Node->getValueType(0));
3247     Tmp1 = DAG.getNode(ISD::FSUB, dl, Node->getValueType(0), Tmp1,
3248                        Node->getOperand(0));
3249     Results.push_back(Tmp1);
3250     break;
3251   case ISD::FABS: {
3252     // Expand Y = FABS(X) -> Y = (X >u 0.0) ? X : fneg(X).
3253     EVT VT = Node->getValueType(0);
3254     Tmp1 = Node->getOperand(0);
3255     Tmp2 = DAG.getConstantFP(0.0, VT);
3256     Tmp2 = DAG.getSetCC(dl, TLI.getSetCCResultType(Tmp1.getValueType()),
3257                         Tmp1, Tmp2, ISD::SETUGT);
3258     Tmp3 = DAG.getNode(ISD::FNEG, dl, VT, Tmp1);
3259     Tmp1 = DAG.getNode(ISD::SELECT, dl, VT, Tmp2, Tmp1, Tmp3);
3260     Results.push_back(Tmp1);
3261     break;
3262   }
3263   case ISD::FSQRT:
3264     Results.push_back(ExpandFPLibCall(Node, RTLIB::SQRT_F32, RTLIB::SQRT_F64,
3265                                       RTLIB::SQRT_F80, RTLIB::SQRT_PPCF128));
3266     break;
3267   case ISD::FSIN:
3268     Results.push_back(ExpandFPLibCall(Node, RTLIB::SIN_F32, RTLIB::SIN_F64,
3269                                       RTLIB::SIN_F80, RTLIB::SIN_PPCF128));
3270     break;
3271   case ISD::FCOS:
3272     Results.push_back(ExpandFPLibCall(Node, RTLIB::COS_F32, RTLIB::COS_F64,
3273                                       RTLIB::COS_F80, RTLIB::COS_PPCF128));
3274     break;
3275   case ISD::FLOG:
3276     Results.push_back(ExpandFPLibCall(Node, RTLIB::LOG_F32, RTLIB::LOG_F64,
3277                                       RTLIB::LOG_F80, RTLIB::LOG_PPCF128));
3278     break;
3279   case ISD::FLOG2:
3280     Results.push_back(ExpandFPLibCall(Node, RTLIB::LOG2_F32, RTLIB::LOG2_F64,
3281                                       RTLIB::LOG2_F80, RTLIB::LOG2_PPCF128));
3282     break;
3283   case ISD::FLOG10:
3284     Results.push_back(ExpandFPLibCall(Node, RTLIB::LOG10_F32, RTLIB::LOG10_F64,
3285                                       RTLIB::LOG10_F80, RTLIB::LOG10_PPCF128));
3286     break;
3287   case ISD::FEXP:
3288     Results.push_back(ExpandFPLibCall(Node, RTLIB::EXP_F32, RTLIB::EXP_F64,
3289                                       RTLIB::EXP_F80, RTLIB::EXP_PPCF128));
3290     break;
3291   case ISD::FEXP2:
3292     Results.push_back(ExpandFPLibCall(Node, RTLIB::EXP2_F32, RTLIB::EXP2_F64,
3293                                       RTLIB::EXP2_F80, RTLIB::EXP2_PPCF128));
3294     break;
3295   case ISD::FTRUNC:
3296     Results.push_back(ExpandFPLibCall(Node, RTLIB::TRUNC_F32, RTLIB::TRUNC_F64,
3297                                       RTLIB::TRUNC_F80, RTLIB::TRUNC_PPCF128));
3298     break;
3299   case ISD::FFLOOR:
3300     Results.push_back(ExpandFPLibCall(Node, RTLIB::FLOOR_F32, RTLIB::FLOOR_F64,
3301                                       RTLIB::FLOOR_F80, RTLIB::FLOOR_PPCF128));
3302     break;
3303   case ISD::FCEIL:
3304     Results.push_back(ExpandFPLibCall(Node, RTLIB::CEIL_F32, RTLIB::CEIL_F64,
3305                                       RTLIB::CEIL_F80, RTLIB::CEIL_PPCF128));
3306     break;
3307   case ISD::FRINT:
3308     Results.push_back(ExpandFPLibCall(Node, RTLIB::RINT_F32, RTLIB::RINT_F64,
3309                                       RTLIB::RINT_F80, RTLIB::RINT_PPCF128));
3310     break;
3311   case ISD::FNEARBYINT:
3312     Results.push_back(ExpandFPLibCall(Node, RTLIB::NEARBYINT_F32,
3313                                       RTLIB::NEARBYINT_F64,
3314                                       RTLIB::NEARBYINT_F80,
3315                                       RTLIB::NEARBYINT_PPCF128));
3316     break;
3317   case ISD::FPOWI:
3318     Results.push_back(ExpandFPLibCall(Node, RTLIB::POWI_F32, RTLIB::POWI_F64,
3319                                       RTLIB::POWI_F80, RTLIB::POWI_PPCF128));
3320     break;
3321   case ISD::FPOW:
3322     Results.push_back(ExpandFPLibCall(Node, RTLIB::POW_F32, RTLIB::POW_F64,
3323                                       RTLIB::POW_F80, RTLIB::POW_PPCF128));
3324     break;
3325   case ISD::FDIV:
3326     Results.push_back(ExpandFPLibCall(Node, RTLIB::DIV_F32, RTLIB::DIV_F64,
3327                                       RTLIB::DIV_F80, RTLIB::DIV_PPCF128));
3328     break;
3329   case ISD::FREM:
3330     Results.push_back(ExpandFPLibCall(Node, RTLIB::REM_F32, RTLIB::REM_F64,
3331                                       RTLIB::REM_F80, RTLIB::REM_PPCF128));
3332     break;
3333   case ISD::FMA:
3334     Results.push_back(ExpandFPLibCall(Node, RTLIB::FMA_F32, RTLIB::FMA_F64,
3335                                       RTLIB::FMA_F80, RTLIB::FMA_PPCF128));
3336     break;
3337   case ISD::FP16_TO_FP32:
3338     Results.push_back(ExpandLibCall(RTLIB::FPEXT_F16_F32, Node, false));
3339     break;
3340   case ISD::FP32_TO_FP16:
3341     Results.push_back(ExpandLibCall(RTLIB::FPROUND_F32_F16, Node, false));
3342     break;
3343   case ISD::ConstantFP: {
3344     ConstantFPSDNode *CFP = cast<ConstantFPSDNode>(Node);
3345     // Check to see if this FP immediate is already legal.
3346     // If this is a legal constant, turn it into a TargetConstantFP node.
3347     if (TLI.isFPImmLegal(CFP->getValueAPF(), Node->getValueType(0)))
3348       Results.push_back(SDValue(Node, 0));
3349     else
3350       Results.push_back(ExpandConstantFP(CFP, true, DAG, TLI));
3351     break;
3352   }
3353   case ISD::EHSELECTION: {
3354     unsigned Reg = TLI.getExceptionSelectorRegister();
3355     assert(Reg && "Can't expand to unknown register!");
3356     Results.push_back(DAG.getCopyFromReg(Node->getOperand(1), dl, Reg,
3357                                          Node->getValueType(0)));
3358     Results.push_back(Results[0].getValue(1));
3359     break;
3360   }
3361   case ISD::EXCEPTIONADDR: {
3362     unsigned Reg = TLI.getExceptionAddressRegister();
3363     assert(Reg && "Can't expand to unknown register!");
3364     Results.push_back(DAG.getCopyFromReg(Node->getOperand(0), dl, Reg,
3365                                          Node->getValueType(0)));
3366     Results.push_back(Results[0].getValue(1));
3367     break;
3368   }
3369   case ISD::SUB: {
3370     EVT VT = Node->getValueType(0);
3371     assert(TLI.isOperationLegalOrCustom(ISD::ADD, VT) &&
3372            TLI.isOperationLegalOrCustom(ISD::XOR, VT) &&
3373            "Don't know how to expand this subtraction!");
3374     Tmp1 = DAG.getNode(ISD::XOR, dl, VT, Node->getOperand(1),
3375                DAG.getConstant(APInt::getAllOnesValue(VT.getSizeInBits()), VT));
3376     Tmp1 = DAG.getNode(ISD::ADD, dl, VT, Tmp2, DAG.getConstant(1, VT));
3377     Results.push_back(DAG.getNode(ISD::ADD, dl, VT, Node->getOperand(0), Tmp1));
3378     break;
3379   }
3380   case ISD::UREM:
3381   case ISD::SREM: {
3382     EVT VT = Node->getValueType(0);
3383     SDVTList VTs = DAG.getVTList(VT, VT);
3384     bool isSigned = Node->getOpcode() == ISD::SREM;
3385     unsigned DivOpc = isSigned ? ISD::SDIV : ISD::UDIV;
3386     unsigned DivRemOpc = isSigned ? ISD::SDIVREM : ISD::UDIVREM;
3387     Tmp2 = Node->getOperand(0);
3388     Tmp3 = Node->getOperand(1);
3389     if (TLI.isOperationLegalOrCustom(DivRemOpc, VT) ||
3390         (isDivRemLibcallAvailable(Node, isSigned, TLI) &&
3391          UseDivRem(Node, isSigned, false))) {
3392       Tmp1 = DAG.getNode(DivRemOpc, dl, VTs, Tmp2, Tmp3).getValue(1);
3393     } else if (TLI.isOperationLegalOrCustom(DivOpc, VT)) {
3394       // X % Y -> X-X/Y*Y
3395       Tmp1 = DAG.getNode(DivOpc, dl, VT, Tmp2, Tmp3);
3396       Tmp1 = DAG.getNode(ISD::MUL, dl, VT, Tmp1, Tmp3);
3397       Tmp1 = DAG.getNode(ISD::SUB, dl, VT, Tmp2, Tmp1);
3398     } else if (isSigned)
3399       Tmp1 = ExpandIntLibCall(Node, true,
3400                               RTLIB::SREM_I8,
3401                               RTLIB::SREM_I16, RTLIB::SREM_I32,
3402                               RTLIB::SREM_I64, RTLIB::SREM_I128);
3403     else
3404       Tmp1 = ExpandIntLibCall(Node, false,
3405                               RTLIB::UREM_I8,
3406                               RTLIB::UREM_I16, RTLIB::UREM_I32,
3407                               RTLIB::UREM_I64, RTLIB::UREM_I128);
3408     Results.push_back(Tmp1);
3409     break;
3410   }
3411   case ISD::UDIV:
3412   case ISD::SDIV: {
3413     bool isSigned = Node->getOpcode() == ISD::SDIV;
3414     unsigned DivRemOpc = isSigned ? ISD::SDIVREM : ISD::UDIVREM;
3415     EVT VT = Node->getValueType(0);
3416     SDVTList VTs = DAG.getVTList(VT, VT);
3417     if (TLI.isOperationLegalOrCustom(DivRemOpc, VT) ||
3418         (isDivRemLibcallAvailable(Node, isSigned, TLI) &&
3419          UseDivRem(Node, isSigned, true)))
3420       Tmp1 = DAG.getNode(DivRemOpc, dl, VTs, Node->getOperand(0),
3421                          Node->getOperand(1));
3422     else if (isSigned)
3423       Tmp1 = ExpandIntLibCall(Node, true,
3424                               RTLIB::SDIV_I8,
3425                               RTLIB::SDIV_I16, RTLIB::SDIV_I32,
3426                               RTLIB::SDIV_I64, RTLIB::SDIV_I128);
3427     else
3428       Tmp1 = ExpandIntLibCall(Node, false,
3429                               RTLIB::UDIV_I8,
3430                               RTLIB::UDIV_I16, RTLIB::UDIV_I32,
3431                               RTLIB::UDIV_I64, RTLIB::UDIV_I128);
3432     Results.push_back(Tmp1);
3433     break;
3434   }
3435   case ISD::MULHU:
3436   case ISD::MULHS: {
3437     unsigned ExpandOpcode = Node->getOpcode() == ISD::MULHU ? ISD::UMUL_LOHI :
3438                                                               ISD::SMUL_LOHI;
3439     EVT VT = Node->getValueType(0);
3440     SDVTList VTs = DAG.getVTList(VT, VT);
3441     assert(TLI.isOperationLegalOrCustom(ExpandOpcode, VT) &&
3442            "If this wasn't legal, it shouldn't have been created!");
3443     Tmp1 = DAG.getNode(ExpandOpcode, dl, VTs, Node->getOperand(0),
3444                        Node->getOperand(1));
3445     Results.push_back(Tmp1.getValue(1));
3446     break;
3447   }
3448   case ISD::SDIVREM:
3449   case ISD::UDIVREM:
3450     // Expand into divrem libcall
3451     ExpandDivRemLibCall(Node, Results);
3452     break;
3453   case ISD::MUL: {
3454     EVT VT = Node->getValueType(0);
3455     SDVTList VTs = DAG.getVTList(VT, VT);
3456     // See if multiply or divide can be lowered using two-result operations.
3457     // We just need the low half of the multiply; try both the signed
3458     // and unsigned forms. If the target supports both SMUL_LOHI and
3459     // UMUL_LOHI, form a preference by checking which forms of plain
3460     // MULH it supports.
3461     bool HasSMUL_LOHI = TLI.isOperationLegalOrCustom(ISD::SMUL_LOHI, VT);
3462     bool HasUMUL_LOHI = TLI.isOperationLegalOrCustom(ISD::UMUL_LOHI, VT);
3463     bool HasMULHS = TLI.isOperationLegalOrCustom(ISD::MULHS, VT);
3464     bool HasMULHU = TLI.isOperationLegalOrCustom(ISD::MULHU, VT);
3465     unsigned OpToUse = 0;
3466     if (HasSMUL_LOHI && !HasMULHS) {
3467       OpToUse = ISD::SMUL_LOHI;
3468     } else if (HasUMUL_LOHI && !HasMULHU) {
3469       OpToUse = ISD::UMUL_LOHI;
3470     } else if (HasSMUL_LOHI) {
3471       OpToUse = ISD::SMUL_LOHI;
3472     } else if (HasUMUL_LOHI) {
3473       OpToUse = ISD::UMUL_LOHI;
3474     }
3475     if (OpToUse) {
3476       Results.push_back(DAG.getNode(OpToUse, dl, VTs, Node->getOperand(0),
3477                                     Node->getOperand(1)));
3478       break;
3479     }
3480     Tmp1 = ExpandIntLibCall(Node, false,
3481                             RTLIB::MUL_I8,
3482                             RTLIB::MUL_I16, RTLIB::MUL_I32,
3483                             RTLIB::MUL_I64, RTLIB::MUL_I128);
3484     Results.push_back(Tmp1);
3485     break;
3486   }
3487   case ISD::SADDO:
3488   case ISD::SSUBO: {
3489     SDValue LHS = Node->getOperand(0);
3490     SDValue RHS = Node->getOperand(1);
3491     SDValue Sum = DAG.getNode(Node->getOpcode() == ISD::SADDO ?
3492                               ISD::ADD : ISD::SUB, dl, LHS.getValueType(),
3493                               LHS, RHS);
3494     Results.push_back(Sum);
3495     EVT OType = Node->getValueType(1);
3496
3497     SDValue Zero = DAG.getConstant(0, LHS.getValueType());
3498
3499     //   LHSSign -> LHS >= 0
3500     //   RHSSign -> RHS >= 0
3501     //   SumSign -> Sum >= 0
3502     //
3503     //   Add:
3504     //   Overflow -> (LHSSign == RHSSign) && (LHSSign != SumSign)
3505     //   Sub:
3506     //   Overflow -> (LHSSign != RHSSign) && (LHSSign != SumSign)
3507     //
3508     SDValue LHSSign = DAG.getSetCC(dl, OType, LHS, Zero, ISD::SETGE);
3509     SDValue RHSSign = DAG.getSetCC(dl, OType, RHS, Zero, ISD::SETGE);
3510     SDValue SignsMatch = DAG.getSetCC(dl, OType, LHSSign, RHSSign,
3511                                       Node->getOpcode() == ISD::SADDO ?
3512                                       ISD::SETEQ : ISD::SETNE);
3513
3514     SDValue SumSign = DAG.getSetCC(dl, OType, Sum, Zero, ISD::SETGE);
3515     SDValue SumSignNE = DAG.getSetCC(dl, OType, LHSSign, SumSign, ISD::SETNE);
3516
3517     SDValue Cmp = DAG.getNode(ISD::AND, dl, OType, SignsMatch, SumSignNE);
3518     Results.push_back(Cmp);
3519     break;
3520   }
3521   case ISD::UADDO:
3522   case ISD::USUBO: {
3523     SDValue LHS = Node->getOperand(0);
3524     SDValue RHS = Node->getOperand(1);
3525     SDValue Sum = DAG.getNode(Node->getOpcode() == ISD::UADDO ?
3526                               ISD::ADD : ISD::SUB, dl, LHS.getValueType(),
3527                               LHS, RHS);
3528     Results.push_back(Sum);
3529     Results.push_back(DAG.getSetCC(dl, Node->getValueType(1), Sum, LHS,
3530                                    Node->getOpcode () == ISD::UADDO ?
3531                                    ISD::SETULT : ISD::SETUGT));
3532     break;
3533   }
3534   case ISD::UMULO:
3535   case ISD::SMULO: {
3536     EVT VT = Node->getValueType(0);
3537     EVT WideVT = EVT::getIntegerVT(*DAG.getContext(), VT.getSizeInBits() * 2);
3538     SDValue LHS = Node->getOperand(0);
3539     SDValue RHS = Node->getOperand(1);
3540     SDValue BottomHalf;
3541     SDValue TopHalf;
3542     static const unsigned Ops[2][3] =
3543         { { ISD::MULHU, ISD::UMUL_LOHI, ISD::ZERO_EXTEND },
3544           { ISD::MULHS, ISD::SMUL_LOHI, ISD::SIGN_EXTEND }};
3545     bool isSigned = Node->getOpcode() == ISD::SMULO;
3546     if (TLI.isOperationLegalOrCustom(Ops[isSigned][0], VT)) {
3547       BottomHalf = DAG.getNode(ISD::MUL, dl, VT, LHS, RHS);
3548       TopHalf = DAG.getNode(Ops[isSigned][0], dl, VT, LHS, RHS);
3549     } else if (TLI.isOperationLegalOrCustom(Ops[isSigned][1], VT)) {
3550       BottomHalf = DAG.getNode(Ops[isSigned][1], dl, DAG.getVTList(VT, VT), LHS,
3551                                RHS);
3552       TopHalf = BottomHalf.getValue(1);
3553     } else if (TLI.isTypeLegal(EVT::getIntegerVT(*DAG.getContext(),
3554                                                  VT.getSizeInBits() * 2))) {
3555       LHS = DAG.getNode(Ops[isSigned][2], dl, WideVT, LHS);
3556       RHS = DAG.getNode(Ops[isSigned][2], dl, WideVT, RHS);
3557       Tmp1 = DAG.getNode(ISD::MUL, dl, WideVT, LHS, RHS);
3558       BottomHalf = DAG.getNode(ISD::EXTRACT_ELEMENT, dl, VT, Tmp1,
3559                                DAG.getIntPtrConstant(0));
3560       TopHalf = DAG.getNode(ISD::EXTRACT_ELEMENT, dl, VT, Tmp1,
3561                             DAG.getIntPtrConstant(1));
3562     } else {
3563       // We can fall back to a libcall with an illegal type for the MUL if we
3564       // have a libcall big enough.
3565       // Also, we can fall back to a division in some cases, but that's a big
3566       // performance hit in the general case.
3567       RTLIB::Libcall LC = RTLIB::UNKNOWN_LIBCALL;
3568       if (WideVT == MVT::i16)
3569         LC = RTLIB::MUL_I16;
3570       else if (WideVT == MVT::i32)
3571         LC = RTLIB::MUL_I32;
3572       else if (WideVT == MVT::i64)
3573         LC = RTLIB::MUL_I64;
3574       else if (WideVT == MVT::i128)
3575         LC = RTLIB::MUL_I128;
3576       assert(LC != RTLIB::UNKNOWN_LIBCALL && "Cannot expand this operation!");
3577
3578       // The high part is obtained by SRA'ing all but one of the bits of low
3579       // part.
3580       unsigned LoSize = VT.getSizeInBits();
3581       SDValue HiLHS = DAG.getNode(ISD::SRA, dl, VT, RHS,
3582                                 DAG.getConstant(LoSize-1, TLI.getPointerTy()));
3583       SDValue HiRHS = DAG.getNode(ISD::SRA, dl, VT, LHS,
3584                                 DAG.getConstant(LoSize-1, TLI.getPointerTy()));
3585
3586       // Here we're passing the 2 arguments explicitly as 4 arguments that are
3587       // pre-lowered to the correct types. This all depends upon WideVT not
3588       // being a legal type for the architecture and thus has to be split to
3589       // two arguments.
3590       SDValue Args[] = { LHS, HiLHS, RHS, HiRHS };
3591       SDValue Ret = ExpandLibCall(LC, WideVT, Args, 4, isSigned, dl);
3592       BottomHalf = DAG.getNode(ISD::EXTRACT_ELEMENT, dl, VT, Ret,
3593                                DAG.getIntPtrConstant(0));
3594       TopHalf = DAG.getNode(ISD::EXTRACT_ELEMENT, dl, VT, Ret,
3595                             DAG.getIntPtrConstant(1));
3596     }
3597
3598     if (isSigned) {
3599       Tmp1 = DAG.getConstant(VT.getSizeInBits() - 1,
3600                              TLI.getShiftAmountTy(BottomHalf.getValueType()));
3601       Tmp1 = DAG.getNode(ISD::SRA, dl, VT, BottomHalf, Tmp1);
3602       TopHalf = DAG.getSetCC(dl, TLI.getSetCCResultType(VT), TopHalf, Tmp1,
3603                              ISD::SETNE);
3604     } else {
3605       TopHalf = DAG.getSetCC(dl, TLI.getSetCCResultType(VT), TopHalf,
3606                              DAG.getConstant(0, VT), ISD::SETNE);
3607     }
3608     Results.push_back(BottomHalf);
3609     Results.push_back(TopHalf);
3610     break;
3611   }
3612   case ISD::BUILD_PAIR: {
3613     EVT PairTy = Node->getValueType(0);
3614     Tmp1 = DAG.getNode(ISD::ZERO_EXTEND, dl, PairTy, Node->getOperand(0));
3615     Tmp2 = DAG.getNode(ISD::ANY_EXTEND, dl, PairTy, Node->getOperand(1));
3616     Tmp2 = DAG.getNode(ISD::SHL, dl, PairTy, Tmp2,
3617                        DAG.getConstant(PairTy.getSizeInBits()/2,
3618                                        TLI.getShiftAmountTy(PairTy)));
3619     Results.push_back(DAG.getNode(ISD::OR, dl, PairTy, Tmp1, Tmp2));
3620     break;
3621   }
3622   case ISD::SELECT:
3623     Tmp1 = Node->getOperand(0);
3624     Tmp2 = Node->getOperand(1);
3625     Tmp3 = Node->getOperand(2);
3626     if (Tmp1.getOpcode() == ISD::SETCC) {
3627       Tmp1 = DAG.getSelectCC(dl, Tmp1.getOperand(0), Tmp1.getOperand(1),
3628                              Tmp2, Tmp3,
3629                              cast<CondCodeSDNode>(Tmp1.getOperand(2))->get());
3630     } else {
3631       Tmp1 = DAG.getSelectCC(dl, Tmp1,
3632                              DAG.getConstant(0, Tmp1.getValueType()),
3633                              Tmp2, Tmp3, ISD::SETNE);
3634     }
3635     Results.push_back(Tmp1);
3636     break;
3637   case ISD::BR_JT: {
3638     SDValue Chain = Node->getOperand(0);
3639     SDValue Table = Node->getOperand(1);
3640     SDValue Index = Node->getOperand(2);
3641
3642     EVT PTy = TLI.getPointerTy();
3643
3644     const TargetData &TD = *TLI.getTargetData();
3645     unsigned EntrySize =
3646       DAG.getMachineFunction().getJumpTableInfo()->getEntrySize(TD);
3647
3648     Index = DAG.getNode(ISD::MUL, dl, PTy,
3649                         Index, DAG.getConstant(EntrySize, PTy));
3650     SDValue Addr = DAG.getNode(ISD::ADD, dl, PTy, Index, Table);
3651
3652     EVT MemVT = EVT::getIntegerVT(*DAG.getContext(), EntrySize * 8);
3653     SDValue LD = DAG.getExtLoad(ISD::SEXTLOAD, dl, PTy, Chain, Addr,
3654                                 MachinePointerInfo::getJumpTable(), MemVT,
3655                                 false, false, 0);
3656     Addr = LD;
3657     if (TM.getRelocationModel() == Reloc::PIC_) {
3658       // For PIC, the sequence is:
3659       // BRIND(load(Jumptable + index) + RelocBase)
3660       // RelocBase can be JumpTable, GOT or some sort of global base.
3661       Addr = DAG.getNode(ISD::ADD, dl, PTy, Addr,
3662                           TLI.getPICJumpTableRelocBase(Table, DAG));
3663     }
3664     Tmp1 = DAG.getNode(ISD::BRIND, dl, MVT::Other, LD.getValue(1), Addr);
3665     Results.push_back(Tmp1);
3666     break;
3667   }
3668   case ISD::BRCOND:
3669     // Expand brcond's setcc into its constituent parts and create a BR_CC
3670     // Node.
3671     Tmp1 = Node->getOperand(0);
3672     Tmp2 = Node->getOperand(1);
3673     if (Tmp2.getOpcode() == ISD::SETCC) {
3674       Tmp1 = DAG.getNode(ISD::BR_CC, dl, MVT::Other,
3675                          Tmp1, Tmp2.getOperand(2),
3676                          Tmp2.getOperand(0), Tmp2.getOperand(1),
3677                          Node->getOperand(2));
3678     } else {
3679       // We test only the i1 bit.  Skip the AND if UNDEF.
3680       Tmp3 = (Tmp2.getOpcode() == ISD::UNDEF) ? Tmp2 :
3681         DAG.getNode(ISD::AND, dl, Tmp2.getValueType(), Tmp2,
3682                     DAG.getConstant(1, Tmp2.getValueType()));
3683       Tmp1 = DAG.getNode(ISD::BR_CC, dl, MVT::Other, Tmp1,
3684                          DAG.getCondCode(ISD::SETNE), Tmp3,
3685                          DAG.getConstant(0, Tmp3.getValueType()),
3686                          Node->getOperand(2));
3687     }
3688     Results.push_back(Tmp1);
3689     break;
3690   case ISD::SETCC: {
3691     Tmp1 = Node->getOperand(0);
3692     Tmp2 = Node->getOperand(1);
3693     Tmp3 = Node->getOperand(2);
3694     LegalizeSetCCCondCode(Node->getValueType(0), Tmp1, Tmp2, Tmp3, dl);
3695
3696     // If we expanded the SETCC into an AND/OR, return the new node
3697     if (Tmp2.getNode() == 0) {
3698       Results.push_back(Tmp1);
3699       break;
3700     }
3701
3702     // Otherwise, SETCC for the given comparison type must be completely
3703     // illegal; expand it into a SELECT_CC.
3704     EVT VT = Node->getValueType(0);
3705     Tmp1 = DAG.getNode(ISD::SELECT_CC, dl, VT, Tmp1, Tmp2,
3706                        DAG.getConstant(1, VT), DAG.getConstant(0, VT), Tmp3);
3707     Results.push_back(Tmp1);
3708     break;
3709   }
3710   case ISD::SELECT_CC: {
3711     Tmp1 = Node->getOperand(0);   // LHS
3712     Tmp2 = Node->getOperand(1);   // RHS
3713     Tmp3 = Node->getOperand(2);   // True
3714     Tmp4 = Node->getOperand(3);   // False
3715     SDValue CC = Node->getOperand(4);
3716
3717     LegalizeSetCCCondCode(TLI.getSetCCResultType(Tmp1.getValueType()),
3718                           Tmp1, Tmp2, CC, dl);
3719
3720     assert(!Tmp2.getNode() && "Can't legalize SELECT_CC with legal condition!");
3721     Tmp2 = DAG.getConstant(0, Tmp1.getValueType());
3722     CC = DAG.getCondCode(ISD::SETNE);
3723     Tmp1 = DAG.getNode(ISD::SELECT_CC, dl, Node->getValueType(0), Tmp1, Tmp2,
3724                        Tmp3, Tmp4, CC);
3725     Results.push_back(Tmp1);
3726     break;
3727   }
3728   case ISD::BR_CC: {
3729     Tmp1 = Node->getOperand(0);              // Chain
3730     Tmp2 = Node->getOperand(2);              // LHS
3731     Tmp3 = Node->getOperand(3);              // RHS
3732     Tmp4 = Node->getOperand(1);              // CC
3733
3734     LegalizeSetCCCondCode(TLI.getSetCCResultType(Tmp2.getValueType()),
3735                           Tmp2, Tmp3, Tmp4, dl);
3736     assert(LastCALLSEQ.size() == 1 && "branch inside CALLSEQ_BEGIN/END?");
3737     setLastCALLSEQ(DAG.getEntryNode());
3738
3739     assert(!Tmp3.getNode() && "Can't legalize BR_CC with legal condition!");
3740     Tmp3 = DAG.getConstant(0, Tmp2.getValueType());
3741     Tmp4 = DAG.getCondCode(ISD::SETNE);
3742     Tmp1 = DAG.getNode(ISD::BR_CC, dl, Node->getValueType(0), Tmp1, Tmp4, Tmp2,
3743                        Tmp3, Node->getOperand(4));
3744     Results.push_back(Tmp1);
3745     break;
3746   }
3747   case ISD::GLOBAL_OFFSET_TABLE:
3748   case ISD::GlobalAddress:
3749   case ISD::GlobalTLSAddress:
3750   case ISD::ExternalSymbol:
3751   case ISD::ConstantPool:
3752   case ISD::JumpTable:
3753   case ISD::INTRINSIC_W_CHAIN:
3754   case ISD::INTRINSIC_WO_CHAIN:
3755   case ISD::INTRINSIC_VOID:
3756     // FIXME: Custom lowering for these operations shouldn't return null!
3757     for (unsigned i = 0, e = Node->getNumValues(); i != e; ++i)
3758       Results.push_back(SDValue(Node, i));
3759     break;
3760   }
3761 }
3762 void SelectionDAGLegalize::PromoteNode(SDNode *Node,
3763                                        SmallVectorImpl<SDValue> &Results) {
3764   EVT OVT = Node->getValueType(0);
3765   if (Node->getOpcode() == ISD::UINT_TO_FP ||
3766       Node->getOpcode() == ISD::SINT_TO_FP ||
3767       Node->getOpcode() == ISD::SETCC) {
3768     OVT = Node->getOperand(0).getValueType();
3769   }
3770   EVT NVT = TLI.getTypeToPromoteTo(Node->getOpcode(), OVT);
3771   DebugLoc dl = Node->getDebugLoc();
3772   SDValue Tmp1, Tmp2, Tmp3;
3773   switch (Node->getOpcode()) {
3774   case ISD::CTTZ:
3775   case ISD::CTLZ:
3776   case ISD::CTPOP:
3777     // Zero extend the argument.
3778     Tmp1 = DAG.getNode(ISD::ZERO_EXTEND, dl, NVT, Node->getOperand(0));
3779     // Perform the larger operation.
3780     Tmp1 = DAG.getNode(Node->getOpcode(), dl, NVT, Tmp1);
3781     if (Node->getOpcode() == ISD::CTTZ) {
3782       //if Tmp1 == sizeinbits(NVT) then Tmp1 = sizeinbits(Old VT)
3783       Tmp2 = DAG.getSetCC(dl, TLI.getSetCCResultType(NVT),
3784                           Tmp1, DAG.getConstant(NVT.getSizeInBits(), NVT),
3785                           ISD::SETEQ);
3786       Tmp1 = DAG.getNode(ISD::SELECT, dl, NVT, Tmp2,
3787                           DAG.getConstant(OVT.getSizeInBits(), NVT), Tmp1);
3788     } else if (Node->getOpcode() == ISD::CTLZ) {
3789       // Tmp1 = Tmp1 - (sizeinbits(NVT) - sizeinbits(Old VT))
3790       Tmp1 = DAG.getNode(ISD::SUB, dl, NVT, Tmp1,
3791                           DAG.getConstant(NVT.getSizeInBits() -
3792                                           OVT.getSizeInBits(), NVT));
3793     }
3794     Results.push_back(DAG.getNode(ISD::TRUNCATE, dl, OVT, Tmp1));
3795     break;
3796   case ISD::BSWAP: {
3797     unsigned DiffBits = NVT.getSizeInBits() - OVT.getSizeInBits();
3798     Tmp1 = DAG.getNode(ISD::ZERO_EXTEND, dl, NVT, Node->getOperand(0));
3799     Tmp1 = DAG.getNode(ISD::BSWAP, dl, NVT, Tmp1);
3800     Tmp1 = DAG.getNode(ISD::SRL, dl, NVT, Tmp1,
3801                           DAG.getConstant(DiffBits, TLI.getShiftAmountTy(NVT)));
3802     Results.push_back(Tmp1);
3803     break;
3804   }
3805   case ISD::FP_TO_UINT:
3806   case ISD::FP_TO_SINT:
3807     Tmp1 = PromoteLegalFP_TO_INT(Node->getOperand(0), Node->getValueType(0),
3808                                  Node->getOpcode() == ISD::FP_TO_SINT, dl);
3809     Results.push_back(Tmp1);
3810     break;
3811   case ISD::UINT_TO_FP:
3812   case ISD::SINT_TO_FP:
3813     Tmp1 = PromoteLegalINT_TO_FP(Node->getOperand(0), Node->getValueType(0),
3814                                  Node->getOpcode() == ISD::SINT_TO_FP, dl);
3815     Results.push_back(Tmp1);
3816     break;
3817   case ISD::AND:
3818   case ISD::OR:
3819   case ISD::XOR: {
3820     unsigned ExtOp, TruncOp;
3821     if (OVT.isVector()) {
3822       ExtOp   = ISD::BITCAST;
3823       TruncOp = ISD::BITCAST;
3824     } else {
3825       assert(OVT.isInteger() && "Cannot promote logic operation");
3826       ExtOp   = ISD::ANY_EXTEND;
3827       TruncOp = ISD::TRUNCATE;
3828     }
3829     // Promote each of the values to the new type.
3830     Tmp1 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(0));
3831     Tmp2 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(1));
3832     // Perform the larger operation, then convert back
3833     Tmp1 = DAG.getNode(Node->getOpcode(), dl, NVT, Tmp1, Tmp2);
3834     Results.push_back(DAG.getNode(TruncOp, dl, OVT, Tmp1));
3835     break;
3836   }
3837   case ISD::SELECT: {
3838     unsigned ExtOp, TruncOp;
3839     if (Node->getValueType(0).isVector()) {
3840       ExtOp   = ISD::BITCAST;
3841       TruncOp = ISD::BITCAST;
3842     } else if (Node->getValueType(0).isInteger()) {
3843       ExtOp   = ISD::ANY_EXTEND;
3844       TruncOp = ISD::TRUNCATE;
3845     } else {
3846       ExtOp   = ISD::FP_EXTEND;
3847       TruncOp = ISD::FP_ROUND;
3848     }
3849     Tmp1 = Node->getOperand(0);
3850     // Promote each of the values to the new type.
3851     Tmp2 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(1));
3852     Tmp3 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(2));
3853     // Perform the larger operation, then round down.
3854     Tmp1 = DAG.getNode(ISD::SELECT, dl, NVT, Tmp1, Tmp2, Tmp3);
3855     if (TruncOp != ISD::FP_ROUND)
3856       Tmp1 = DAG.getNode(TruncOp, dl, Node->getValueType(0), Tmp1);
3857     else
3858       Tmp1 = DAG.getNode(TruncOp, dl, Node->getValueType(0), Tmp1,
3859                          DAG.getIntPtrConstant(0));
3860     Results.push_back(Tmp1);
3861     break;
3862   }
3863   case ISD::VECTOR_SHUFFLE: {
3864     SmallVector<int, 8> Mask;
3865     cast<ShuffleVectorSDNode>(Node)->getMask(Mask);
3866
3867     // Cast the two input vectors.
3868     Tmp1 = DAG.getNode(ISD::BITCAST, dl, NVT, Node->getOperand(0));
3869     Tmp2 = DAG.getNode(ISD::BITCAST, dl, NVT, Node->getOperand(1));
3870
3871     // Convert the shuffle mask to the right # elements.
3872     Tmp1 = ShuffleWithNarrowerEltType(NVT, OVT, dl, Tmp1, Tmp2, Mask);
3873     Tmp1 = DAG.getNode(ISD::BITCAST, dl, OVT, Tmp1);
3874     Results.push_back(Tmp1);
3875     break;
3876   }
3877   case ISD::SETCC: {
3878     unsigned ExtOp = ISD::FP_EXTEND;
3879     if (NVT.isInteger()) {
3880       ISD::CondCode CCCode =
3881         cast<CondCodeSDNode>(Node->getOperand(2))->get();
3882       ExtOp = isSignedIntSetCC(CCCode) ? ISD::SIGN_EXTEND : ISD::ZERO_EXTEND;
3883     }
3884     Tmp1 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(0));
3885     Tmp2 = DAG.getNode(ExtOp, dl, NVT, Node->getOperand(1));
3886     Results.push_back(DAG.getNode(ISD::SETCC, dl, Node->getValueType(0),
3887                                   Tmp1, Tmp2, Node->getOperand(2)));
3888     break;
3889   }
3890   }
3891 }
3892
3893 // SelectionDAG::Legalize - This is the entry point for the file.
3894 //
3895 void SelectionDAG::Legalize() {
3896   /// run - This is the main entry point to this class.
3897   ///
3898   SelectionDAGLegalize(*this).LegalizeDAG();
3899 }