Trailing whitespace

[oota-llvm.git] / lib / Target / ARM / ARMFastISel.cpp
diff --git a/lib/Target/ARM/ARMFastISel.cpp b/lib/Target/ARM/ARMFastISel.cpp

index eeaaf7efab30423f3bfc2ac7e9b64432f0695f1c..3eac44bc8d7098a08c87ac6277f4ac97069f15a0 100644 (file)
--- a/lib/Target/ARM/ARMFastISel.cpp
+++ b/lib/Target/ARM/ARMFastISel.cpp
@@ -132,6 +132,7 @@ class ARMFastISel : public FastISel {
      bool SelectSRem(const Instruction *I);
      bool SelectCall(const Instruction *I);
      bool SelectSelect(const Instruction *I);
+    bool SelectRet(const Instruction *I);
  
      // Utility routines.
    private:
@@ -448,7 +449,7 @@ unsigned ARMFastISel::ARMMaterializeInt(const Constant *C, EVT VT) {
      AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                              TII.get(ARM::LDRcp), DestReg)
                      .addConstantPoolIndex(Idx)
-                    .addReg(0).addImm(0));
+                    .addImm(0));
  
    return DestReg;
  }
@@ -683,9 +684,9 @@ bool ARMFastISel::ARMComputeRegOffset(const Value *Obj, unsigned &Base,
  }
  
  void ARMFastISel::ARMSimplifyRegOffset(unsigned &Base, int &Offset, EVT VT) {
-  
+
    assert(VT.isSimple() && "Non-simple types are invalid here!");
-  
+
    bool needsLowering = false;
    switch (VT.getSimpleVT().SimpleTy) {
      default:
@@ -703,7 +704,7 @@ void ARMFastISel::ARMSimplifyRegOffset(unsigned &Base, int &Offset, EVT VT) {
        needsLowering = ((Offset & 0xff) != Offset);
        break;
    }
-  
+
    // Since the offset is too large for the load/store instruction
    // get the reg+offset into a register.
    if (needsLowering) {
@@ -745,11 +746,11 @@ bool ARMFastISel::ARMEmitLoad(EVT VT, unsigned &ResultReg,
        RC = ARM::GPRRegisterClass;
        break;
      case MVT::i8:
-      Opc = isThumb ? ARM::t2LDRBi12 : ARM::LDRB;
+      Opc = isThumb ? ARM::t2LDRBi12 : ARM::LDRBi12;
        RC = ARM::GPRRegisterClass;
        break;
      case MVT::i32:
-      Opc = isThumb ? ARM::t2LDRi12 : ARM::LDR;
+      Opc = isThumb ? ARM::t2LDRi12 : ARM::LDRi12;
        RC = ARM::GPRRegisterClass;
        break;
      case MVT::f32:
@@ -765,24 +766,17 @@ bool ARMFastISel::ARMEmitLoad(EVT VT, unsigned &ResultReg,
    }
  
    ResultReg = createResultReg(RC);
-  
+
    ARMSimplifyRegOffset(Base, Offset, VT);
-  
+
    // addrmode5 output depends on the selection dag addressing dividing the
    // offset by 4 that it then later multiplies. Do this here as well.
    if (isFloat)
      Offset /= 4;
-  
-  // The thumb and floating point instructions both take 2 operands, ARM takes
-  // another register.
-  if (isFloat || isThumb)
-    AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
-                            TII.get(Opc), ResultReg)
-                    .addReg(Base).addImm(Offset));
-  else
-    AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
-                            TII.get(Opc), ResultReg)
-                    .addReg(Base).addReg(0).addImm(Offset));
+
+  AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
+                          TII.get(Opc), ResultReg)
+                  .addReg(Base).addImm(Offset));
    return true;
  }
  
@@ -836,12 +830,12 @@ bool ARMFastISel::ARMEmitStore(EVT VT, unsigned SrcReg,
    }
  
    ARMSimplifyRegOffset(Base, Offset, VT);
-  
+
    // addrmode5 output depends on the selection dag addressing dividing the
    // offset by 4 that it then later multiplies. Do this here as well.
    if (isFloat)
      Offset /= 4;
-  
+
    // The thumb addressing mode has operands swapped from the arm addressing
    // mode, the floating point one only has two operands.
    if (isFloat || isThumb)
@@ -1248,12 +1242,12 @@ bool ARMFastISel::FastEmitExtend(ISD::NodeType Opc, EVT DstVT, unsigned Src,
                                   EVT SrcVT, unsigned &ResultReg) {
    unsigned RR = FastEmit_r(SrcVT.getSimpleVT(), DstVT.getSimpleVT(), Opc,
                             Src, /*TODO: Kill=*/false);
-  
+
    if (RR != 0) {
      ResultReg = RR;
      return true;
    } else
-    return false;                                   
+    return false;
  }
  
  // This is largely taken directly from CCAssignFnForNode - we don't support
@@ -1263,8 +1257,12 @@ CCAssignFn *ARMFastISel::CCAssignFnForCall(CallingConv::ID CC, bool Return) {
    switch (CC) {
    default:
      llvm_unreachable("Unsupported calling convention");
-  case CallingConv::C:
    case CallingConv::Fast:
+    // Ignore fastcc. Silence compiler warnings.
+    (void)RetFastCC_ARM_APCS;
+    (void)FastCC_ARM_APCS;
+    // Fallthrough
+  case CallingConv::C:
      // Use target triple & subtarget features to do actual dispatch.
      if (Subtarget->isAAPCS_ABI()) {
        if (Subtarget->hasVFP2() &&
@@ -1309,6 +1307,10 @@ bool ARMFastISel::ProcessCallArgs(SmallVectorImpl<Value*> &Args,
      unsigned Arg = ArgRegs[VA.getValNo()];
      EVT ArgVT = ArgVTs[VA.getValNo()];
  
+    // We don't handle NEON parameters yet.
+    if (VA.getLocVT().isVector() && VA.getLocVT().getSizeInBits() > 64)
+      return false;
+
      // Handle arg promotion, etc.
      switch (VA.getLocInfo()) {
        case CCValAssign::Full: break;
@@ -1329,9 +1331,6 @@ bool ARMFastISel::ProcessCallArgs(SmallVectorImpl<Value*> &Args,
          break;
        }
        case CCValAssign::AExt: {
-        // We don't handle NEON or f64 parameters yet.
-        if (VA.getLocVT().isVector() && VA.getLocVT().getSizeInBits() >= 64)
-          return false;
          bool Emitted = FastEmitExtend(ISD::ANY_EXTEND, VA.getLocVT(),
                                           Arg, ArgVT, Arg);
          if (!Emitted)
@@ -1366,7 +1365,7 @@ bool ARMFastISel::ProcessCallArgs(SmallVectorImpl<Value*> &Args,
      } else if (VA.needsCustom()) {
        // TODO: We need custom lowering for vector (v2f64) args.
        if (VA.getLocVT() != MVT::f64) return false;
-      
+
        CCValAssign &NextVA = ArgLocs[++i];
  
        // TODO: Only handle register args for now.
@@ -1419,7 +1418,7 @@ bool ARMFastISel::FinishCall(EVT RetVT, SmallVectorImpl<unsigned> &UsedRegs,
  
        UsedRegs.push_back(RVLocs[0].getLocReg());
        UsedRegs.push_back(RVLocs[1].getLocReg());
-      
+
        // Finally update the result.
        UpdateValueMap(I, ResultReg);
      } else {
@@ -1440,6 +1439,69 @@ bool ARMFastISel::FinishCall(EVT RetVT, SmallVectorImpl<unsigned> &UsedRegs,
    return true;
  }
  
+bool ARMFastISel::SelectRet(const Instruction *I) {
+  const ReturnInst *Ret = cast<ReturnInst>(I);
+  const Function &F = *I->getParent()->getParent();
+
+  if (!FuncInfo.CanLowerReturn)
+    return false;
+
+  if (F.isVarArg())
+    return false;
+
+  CallingConv::ID CC = F.getCallingConv();
+  if (Ret->getNumOperands() > 0) {
+    SmallVector<ISD::OutputArg, 4> Outs;
+    GetReturnInfo(F.getReturnType(), F.getAttributes().getRetAttributes(),
+                  Outs, TLI);
+
+    // Analyze operands of the call, assigning locations to each operand.
+    SmallVector<CCValAssign, 16> ValLocs;
+    CCState CCInfo(CC, F.isVarArg(), TM, ValLocs, I->getContext());
+    CCInfo.AnalyzeReturn(Outs, CCAssignFnForCall(CC, true /* is Ret */));
+
+    const Value *RV = Ret->getOperand(0);
+    unsigned Reg = getRegForValue(RV);
+    if (Reg == 0)
+      return false;
+
+    // Only handle a single return value for now.
+    if (ValLocs.size() != 1)
+      return false;
+
+    CCValAssign &VA = ValLocs[0];
+
+    // Don't bother handling odd stuff for now.
+    if (VA.getLocInfo() != CCValAssign::Full)
+      return false;
+    // Only handle register returns for now.
+    if (!VA.isRegLoc())
+      return false;
+    // TODO: For now, don't try to handle cases where getLocInfo()
+    // says Full but the types don't match.
+    if (VA.getValVT() != TLI.getValueType(RV->getType()))
+      return false;
+
+    // Make the copy.
+    unsigned SrcReg = Reg + VA.getValNo();
+    unsigned DstReg = VA.getLocReg();
+    const TargetRegisterClass* SrcRC = MRI.getRegClass(SrcReg);
+    // Avoid a cross-class copy. This is very unlikely.
+    if (!SrcRC->contains(DstReg))
+      return false;
+    BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL, TII.get(TargetOpcode::COPY),
+            DstReg).addReg(SrcReg);
+
+    // Mark the register as live out of the function.
+    MRI.addLiveOut(VA.getLocReg());
+  }
+
+  unsigned RetOpc = isThumb ? ARM::tBX_RET : ARM::BX_RET;
+  AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
+                          TII.get(RetOpc)));
+  return true;
+}
+
  // A quick function that will emit a call for a named libcall in F with the
  // vector of passed arguments for the Instruction in I. We can assume that we
  // can emit a call for any libcall we can produce. This is an abridged version
@@ -1667,6 +1729,8 @@ bool ARMFastISel::TargetSelectInstruction(const Instruction *I) {
        return SelectCall(I);
      case Instruction::Select:
        return SelectSelect(I);
+    case Instruction::Ret:
+      return SelectRet(I);
      default: break;
    }
    return false;