Convert more uses of XXXRegisterClass to &XXXRegClass. No functional change since...

[oota-llvm.git] / lib / Target / ARM / ARMFastISel.cpp
diff --git a/lib/Target/ARM/ARMFastISel.cpp b/lib/Target/ARM/ARMFastISel.cpp

index 818b20286af8c1f35d0703106f0fbc8c38055179..de3e430b44071856ce30196a0fb37313bf6036ba 100644 (file)
--- a/lib/Target/ARM/ARMFastISel.cpp
+++ b/lib/Target/ARM/ARMFastISel.cpp
@@ -16,7 +16,6 @@
  #include "ARM.h"
  #include "ARMBaseInstrInfo.h"
  #include "ARMCallingConv.h"
-#include "ARMRegisterInfo.h"
  #include "ARMTargetMachine.h"
  #include "ARMSubtarget.h"
  #include "ARMConstantPoolValue.h"
@@ -911,8 +910,9 @@ void ARMFastISel::ARMSimplifyAddress(Address &Addr, EVT VT, bool useAM3) {
    // put the alloca address into a register, set the base type back to
    // register and continue. This should almost never happen.
    if (needsLowering && Addr.BaseType == Address::FrameIndexBase) {
-    const TargetRegisterClass *RC = isThumb2 ? ARM::tGPRRegisterClass
-                                             : ARM::GPRRegisterClass;
+    const TargetRegisterClass *RC = isThumb2 ?
+      (const TargetRegisterClass*)&ARM::tGPRRegClass :
+      (const TargetRegisterClass*)&ARM::GPRRegClass;
      unsigned ResultReg = createResultReg(RC);
      unsigned Opc = isThumb2 ? ARM::t2ADDri : ARM::ADDri;
      AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
@@ -1006,7 +1006,7 @@ bool ARMFastISel::ARMEmitLoad(EVT VT, unsigned &ResultReg, Address &Addr,
            useAM3 = true;
          }
        }
-      RC = ARM::GPRRegisterClass;
+      RC = &ARM::GPRRegClass;
        break;
      case MVT::i16:
        if (isThumb2) {
@@ -1018,7 +1018,7 @@ bool ARMFastISel::ARMEmitLoad(EVT VT, unsigned &ResultReg, Address &Addr,
          Opc = isZExt ? ARM::LDRH : ARM::LDRSH;
          useAM3 = true;
        }
-      RC = ARM::GPRRegisterClass;
+      RC = &ARM::GPRRegClass;
        break;
      case MVT::i32:
        if (isThumb2) {
@@ -1029,7 +1029,7 @@ bool ARMFastISel::ARMEmitLoad(EVT VT, unsigned &ResultReg, Address &Addr,
        } else {
          Opc = ARM::LDRi12;
        }
-      RC = ARM::GPRRegisterClass;
+      RC = &ARM::GPRRegClass;
        break;
      case MVT::f32:
        if (!Subtarget->hasVFP2()) return false;
@@ -1038,7 +1038,7 @@ bool ARMFastISel::ARMEmitLoad(EVT VT, unsigned &ResultReg, Address &Addr,
          needVMOV = true;
          VT = MVT::i32;
          Opc = isThumb2 ? ARM::t2LDRi12 : ARM::LDRi12;
-        RC = ARM::GPRRegisterClass;
+        RC = &ARM::GPRRegClass;
        } else {
          Opc = ARM::VLDRS;
          RC = TLI.getRegClassFor(VT);
@@ -1107,8 +1107,9 @@ bool ARMFastISel::ARMEmitStore(EVT VT, unsigned SrcReg, Address &Addr,
      // This is mostly going to be Neon/vector support.
      default: return false;
      case MVT::i1: {
-      unsigned Res = createResultReg(isThumb2 ? ARM::tGPRRegisterClass :
-                                               ARM::GPRRegisterClass);
+      unsigned Res = createResultReg(isThumb2 ?
+        (const TargetRegisterClass*)&ARM::tGPRRegClass :
+        (const TargetRegisterClass*)&ARM::GPRRegClass);
        unsigned Opc = isThumb2 ? ARM::t2ANDri : ARM::ANDri;
        AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                                TII.get(Opc), Res)
@@ -1384,7 +1385,10 @@ bool ARMFastISel::ARMEmitCmp(const Value *Src1Value, const Value *Src2Value,
          SrcVT == MVT::i1) {
        const APInt &CIVal = ConstInt->getValue();
        Imm = (isZExt) ? (int)CIVal.getZExtValue() : (int)CIVal.getSExtValue();
-      if (Imm < 0) {
+      // For INT_MIN/LONG_MIN (i.e., 0x80000000) we need to use a cmp, rather
+      // then a cmn, because there is no way to represent 2147483648 as a 
+      // signed 32-bit int.
+      if (Imm < 0 && Imm != (int)0x80000000) {
          isNegativeImm = true;
          Imm = -Imm;
        }
@@ -1475,7 +1479,6 @@ bool ARMFastISel::ARMEmitCmp(const Value *Src1Value, const Value *Src2Value,
  
  bool ARMFastISel::SelectCmp(const Instruction *I) {
    const CmpInst *CI = cast<CmpInst>(I);
-  Type *Ty = CI->getOperand(0)->getType();
  
    // Get the compare predicate.
    ARMCC::CondCodes ARMPred = getComparePred(CI->getPredicate());
@@ -1490,16 +1493,16 @@ bool ARMFastISel::SelectCmp(const Instruction *I) {
    // Now set a register based on the comparison. Explicitly set the predicates
    // here.
    unsigned MovCCOpc = isThumb2 ? ARM::t2MOVCCi : ARM::MOVCCi;
-  const TargetRegisterClass *RC = isThumb2 ? ARM::rGPRRegisterClass
-                                           : ARM::GPRRegisterClass;
+  const TargetRegisterClass *RC = isThumb2 ?
+    (const TargetRegisterClass*)&ARM::rGPRRegClass :
+    (const TargetRegisterClass*)&ARM::GPRRegClass;
    unsigned DestReg = createResultReg(RC);
    Constant *Zero = ConstantInt::get(Type::getInt32Ty(*Context), 0);
    unsigned ZeroReg = TargetMaterializeConstant(Zero);
-  bool isFloat = (Ty->isFloatTy() || Ty->isDoubleTy());
-  unsigned CondReg = isFloat ? ARM::FPSCR : ARM::CPSR;
+  // ARMEmitCmp emits a FMSTAT when necessary, so it's always safe to use CPSR.
    BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL, TII.get(MovCCOpc), DestReg)
            .addReg(ZeroReg).addImm(1)
-          .addImm(ARMPred).addReg(CondReg);
+          .addImm(ARMPred).addReg(ARM::CPSR);
  
    UpdateValueMap(I, DestReg);
    return true;
@@ -1516,7 +1519,7 @@ bool ARMFastISel::SelectFPExt(const Instruction *I) {
    unsigned Op = getRegForValue(V);
    if (Op == 0) return false;
  
-  unsigned Result = createResultReg(ARM::DPRRegisterClass);
+  unsigned Result = createResultReg(&ARM::DPRRegClass);
    AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                            TII.get(ARM::VCVTDS), Result)
                    .addReg(Op));
@@ -1535,7 +1538,7 @@ bool ARMFastISel::SelectFPTrunc(const Instruction *I) {
    unsigned Op = getRegForValue(V);
    if (Op == 0) return false;
  
-  unsigned Result = createResultReg(ARM::SPRRegisterClass);
+  unsigned Result = createResultReg(&ARM::SPRRegClass);
    AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                            TII.get(ARM::VCVTSD), Result)
                    .addReg(Op));
@@ -1851,6 +1854,48 @@ bool ARMFastISel::ProcessCallArgs(SmallVectorImpl<Value*> &Args,
    CCState CCInfo(CC, false, *FuncInfo.MF, TM, ArgLocs, *Context);
    CCInfo.AnalyzeCallOperands(ArgVTs, ArgFlags, CCAssignFnForCall(CC, false));
  
+  // Check that we can handle all of the arguments. If we can't, then bail out
+  // now before we add code to the MBB.
+  for (unsigned i = 0, e = ArgLocs.size(); i != e; ++i) {
+    CCValAssign &VA = ArgLocs[i];
+    MVT ArgVT = ArgVTs[VA.getValNo()];
+
+    // We don't handle NEON/vector parameters yet.
+    if (ArgVT.isVector() || ArgVT.getSizeInBits() > 64)
+      return false;
+
+    // Now copy/store arg to correct locations.
+    if (VA.isRegLoc() && !VA.needsCustom()) {
+      continue;
+    } else if (VA.needsCustom()) {
+      // TODO: We need custom lowering for vector (v2f64) args.
+      if (VA.getLocVT() != MVT::f64 ||
+          // TODO: Only handle register args for now.
+          !VA.isRegLoc() || !ArgLocs[++i].isRegLoc())
+        return false;
+    } else {
+      switch (static_cast<EVT>(ArgVT).getSimpleVT().SimpleTy) {
+      default:
+        return false;
+      case MVT::i1:
+      case MVT::i8:
+      case MVT::i16:
+      case MVT::i32:
+        break;
+      case MVT::f32:
+        if (!Subtarget->hasVFP2())
+          return false;
+        break;
+      case MVT::f64:
+        if (!Subtarget->hasVFP2())
+          return false;
+        break;
+      }
+    }
+  }
+
+  // At the point, we are able to handle the call's arguments in fast isel.
+
    // Get a count of how many bytes are to be pushed on the stack.
    NumBytes = CCInfo.getNextStackOffset();
  
@@ -1866,9 +1911,8 @@ bool ARMFastISel::ProcessCallArgs(SmallVectorImpl<Value*> &Args,
      unsigned Arg = ArgRegs[VA.getValNo()];
      MVT ArgVT = ArgVTs[VA.getValNo()];
  
-    // We don't handle NEON/vector parameters yet.
-    if (ArgVT.isVector() || ArgVT.getSizeInBits() > 64)
-      return false;
+    assert((!ArgVT.isVector() && ArgVT.getSizeInBits() <= 64) &&
+           "We don't handle NEON/vector parameters yet.");
  
      // Handle arg promotion, etc.
      switch (VA.getLocInfo()) {
@@ -1908,12 +1952,13 @@ bool ARMFastISel::ProcessCallArgs(SmallVectorImpl<Value*> &Args,
        RegArgs.push_back(VA.getLocReg());
      } else if (VA.needsCustom()) {
        // TODO: We need custom lowering for vector (v2f64) args.
-      if (VA.getLocVT() != MVT::f64) return false;
+      assert(VA.getLocVT() == MVT::f64 &&
+             "Custom lowering for v2f64 args not available");
  
        CCValAssign &NextVA = ArgLocs[++i];
  
-      // TODO: Only handle register args for now.
-      if(!(VA.isRegLoc() && NextVA.isRegLoc())) return false;
+      assert(VA.isRegLoc() && NextVA.isRegLoc() &&
+             "We only handle register args!");
  
        AddOptionalDefs(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                                TII.get(ARM::VMOVRRD), VA.getLocReg())
@@ -1929,9 +1974,11 @@ bool ARMFastISel::ProcessCallArgs(SmallVectorImpl<Value*> &Args,
        Addr.Base.Reg = ARM::SP;
        Addr.Offset = VA.getLocMemOffset();
  
-      if (!ARMEmitStore(ArgVT, Arg, Addr)) return false;
+      bool EmitRet = ARMEmitStore(ArgVT, Arg, Addr); (void)EmitRet;
+      assert(EmitRet && "Could not emit a store for argument!");
      }
    }
+
    return true;
  }
  
@@ -2067,13 +2114,10 @@ bool ARMFastISel::SelectRet(const Instruction *I) {
  }
  
  unsigned ARMFastISel::ARMSelectCallOp(const GlobalValue *GV) {
-
-  // iOS needs the r9 versions of the opcodes.
-  bool isiOS = Subtarget->isTargetIOS();
    if (isThumb2) {
-    return isiOS ? ARM::tBLr9 : ARM::tBL;
+    return ARM::tBL;
    } else  {
-    return isiOS ? ARM::BLr9 : ARM::BL;
+    return ARM::BL;
    }
  }
  
@@ -2132,11 +2176,10 @@ bool ARMFastISel::ARMEmitLibcall(const Instruction *I, RTLIB::Libcall Call) {
    if (!ProcessCallArgs(Args, ArgRegs, ArgVTs, ArgFlags, RegArgs, CC, NumBytes))
      return false;
  
-  // Issue the call, BLr9 for iOS, BL otherwise.
-  // TODO: Turn this into the table of arm call ops.
+  // Issue the call.
    MachineInstrBuilder MIB;
    unsigned CallOpc = ARMSelectCallOp(NULL);
-  if(isThumb2)
+  if (isThumb2)
      // Explicitly adding the predicate here.
      MIB = AddDefaultPred(BuildMI(*FuncInfo.MBB, FuncInfo.InsertPt, DL,
                           TII.get(CallOpc)))
@@ -2258,8 +2301,7 @@ bool ARMFastISel::SelectCall(const Instruction *I,
    if (!ProcessCallArgs(Args, ArgRegs, ArgVTs, ArgFlags, RegArgs, CC, NumBytes))
      return false;
  
-  // Issue the call, BLr9 for iOS, BL otherwise.
-  // TODO: Turn this into the table of arm call ops.
+  // Issue the call.
    MachineInstrBuilder MIB;
    unsigned CallOpc = ARMSelectCallOp(GV);
    // Explicitly adding the predicate here.
@@ -2305,7 +2347,8 @@ bool ARMFastISel::ARMIsMemCpySmall(uint64_t Len) {
    return Len <= 16;
  }
  
-bool ARMFastISel::ARMTryEmitSmallMemCpy(Address Dest, Address Src, uint64_t Len) {
+bool ARMFastISel::ARMTryEmitSmallMemCpy(Address Dest, Address Src,
+                                        uint64_t Len) {
    // Make sure we don't bloat code by inlining very large memcpy's.
    if (!ARMIsMemCpySmall(Len))
      return false;
@@ -2594,7 +2637,7 @@ bool ARMFastISel::TryToFoldLoad(MachineInstr *MI, unsigned OpNo,
  }
  
  namespace llvm {
-  llvm::FastISel *ARM::createFastISel(FunctionLoweringInfo &funcInfo) {
+  FastISel *ARM::createFastISel(FunctionLoweringInfo &funcInfo) {
      // Completely untested on non-iOS.
      const TargetMachine &TM = funcInfo.MF->getTarget();