[Statepoints] Use Indirect operands for spill slots

[oota-llvm.git] / lib / CodeGen / TargetLoweringBase.cpp
diff --git a/lib/CodeGen/TargetLoweringBase.cpp b/lib/CodeGen/TargetLoweringBase.cpp

index ecfd65931574ea7a8500f8d6491ca75b08832db6..36a31c9d6461dc62d4784c6db96cec1ffb86ef8d 100644 (file)
--- a/lib/CodeGen/TargetLoweringBase.cpp
+++ b/lib/CodeGen/TargetLoweringBase.cpp
@@ -247,13 +247,9 @@ static void InitLibcallNames(const char **Names, const Triple &TT) {
    Names[RTLIB::FPROUND_F80_F64] = "__truncxfdf2";
    Names[RTLIB::FPROUND_F128_F64] = "__trunctfdf2";
    Names[RTLIB::FPROUND_PPCF128_F64] = "__trunctfdf2";
-  Names[RTLIB::FPTOSINT_F32_I8] = "__fixsfqi";
-  Names[RTLIB::FPTOSINT_F32_I16] = "__fixsfhi";
    Names[RTLIB::FPTOSINT_F32_I32] = "__fixsfsi";
    Names[RTLIB::FPTOSINT_F32_I64] = "__fixsfdi";
    Names[RTLIB::FPTOSINT_F32_I128] = "__fixsfti";
-  Names[RTLIB::FPTOSINT_F64_I8] = "__fixdfqi";
-  Names[RTLIB::FPTOSINT_F64_I16] = "__fixdfhi";
    Names[RTLIB::FPTOSINT_F64_I32] = "__fixdfsi";
    Names[RTLIB::FPTOSINT_F64_I64] = "__fixdfdi";
    Names[RTLIB::FPTOSINT_F64_I128] = "__fixdfti";
@@ -266,13 +262,9 @@ static void InitLibcallNames(const char **Names, const Triple &TT) {
    Names[RTLIB::FPTOSINT_PPCF128_I32] = "__fixtfsi";
    Names[RTLIB::FPTOSINT_PPCF128_I64] = "__fixtfdi";
    Names[RTLIB::FPTOSINT_PPCF128_I128] = "__fixtfti";
-  Names[RTLIB::FPTOUINT_F32_I8] = "__fixunssfqi";
-  Names[RTLIB::FPTOUINT_F32_I16] = "__fixunssfhi";
    Names[RTLIB::FPTOUINT_F32_I32] = "__fixunssfsi";
    Names[RTLIB::FPTOUINT_F32_I64] = "__fixunssfdi";
    Names[RTLIB::FPTOUINT_F32_I128] = "__fixunssfti";
-  Names[RTLIB::FPTOUINT_F64_I8] = "__fixunsdfqi";
-  Names[RTLIB::FPTOUINT_F64_I16] = "__fixunsdfhi";
    Names[RTLIB::FPTOUINT_F64_I32] = "__fixunsdfsi";
    Names[RTLIB::FPTOUINT_F64_I64] = "__fixunsdfdi";
    Names[RTLIB::FPTOUINT_F64_I128] = "__fixunsdfti";
@@ -501,10 +493,6 @@ RTLIB::Libcall RTLIB::getFPROUND(EVT OpVT, EVT RetVT) {
  /// UNKNOWN_LIBCALL if there is none.
  RTLIB::Libcall RTLIB::getFPTOSINT(EVT OpVT, EVT RetVT) {
    if (OpVT == MVT::f32) {
-    if (RetVT == MVT::i8)
-      return FPTOSINT_F32_I8;
-    if (RetVT == MVT::i16)
-      return FPTOSINT_F32_I16;
      if (RetVT == MVT::i32)
        return FPTOSINT_F32_I32;
      if (RetVT == MVT::i64)
@@ -512,10 +500,6 @@ RTLIB::Libcall RTLIB::getFPTOSINT(EVT OpVT, EVT RetVT) {
      if (RetVT == MVT::i128)
        return FPTOSINT_F32_I128;
    } else if (OpVT == MVT::f64) {
-    if (RetVT == MVT::i8)
-      return FPTOSINT_F64_I8;
-    if (RetVT == MVT::i16)
-      return FPTOSINT_F64_I16;
      if (RetVT == MVT::i32)
        return FPTOSINT_F64_I32;
      if (RetVT == MVT::i64)
@@ -551,10 +535,6 @@ RTLIB::Libcall RTLIB::getFPTOSINT(EVT OpVT, EVT RetVT) {
  /// UNKNOWN_LIBCALL if there is none.
  RTLIB::Libcall RTLIB::getFPTOUINT(EVT OpVT, EVT RetVT) {
    if (OpVT == MVT::f32) {
-    if (RetVT == MVT::i8)
-      return FPTOUINT_F32_I8;
-    if (RetVT == MVT::i16)
-      return FPTOUINT_F32_I16;
      if (RetVT == MVT::i32)
        return FPTOUINT_F32_I32;
      if (RetVT == MVT::i64)
@@ -562,10 +542,6 @@ RTLIB::Libcall RTLIB::getFPTOUINT(EVT OpVT, EVT RetVT) {
      if (RetVT == MVT::i128)
        return FPTOUINT_F32_I128;
    } else if (OpVT == MVT::f64) {
-    if (RetVT == MVT::i8)
-      return FPTOUINT_F64_I8;
-    if (RetVT == MVT::i16)
-      return FPTOUINT_F64_I16;
      if (RetVT == MVT::i32)
        return FPTOUINT_F64_I32;
      if (RetVT == MVT::i64)
@@ -758,17 +734,13 @@ TargetLoweringBase::TargetLoweringBase(const TargetMachine &tm) : TM(tm) {
    SelectIsExpensive = false;
    HasMultipleConditionRegisters = false;
    HasExtractBitsInsn = false;
-  IntDivIsCheap = false;
    FsqrtIsCheap = false;
-  Pow2SDivIsCheap = false;
    JumpIsExpensive = JumpIsExpensiveOverride;
    PredictableSelectIsExpensive = false;
    MaskAndBranchFoldingIsLegal = false;
    EnableExtLdPromotion = false;
    HasFloatingPointExceptions = true;
    StackPointerRegisterToSaveRestore = 0;
-  ExceptionPointerRegister = 0;
-  ExceptionSelectorRegister = 0;
    BooleanContents = UndefinedBooleanContent;
    BooleanFloatContents = UndefinedBooleanContent;
    BooleanVectorContents = UndefinedBooleanContent;
@@ -778,6 +750,7 @@ TargetLoweringBase::TargetLoweringBase(const TargetMachine &tm) : TM(tm) {
    MinFunctionAlignment = 0;
    PrefFunctionAlignment = 0;
    PrefLoopAlignment = 0;
+  GatherAllAliasesMaxDepth = 6;
    MinStackArgumentAlignment = 1;
    InsertFencesForAtomic = false;
    MinimumJumpTableEntries = 4;
@@ -814,6 +787,8 @@ void TargetLoweringBase::initActions() {
      setOperationAction(ISD::CONCAT_VECTORS, VT, Expand);
      setOperationAction(ISD::FMINNUM, VT, Expand);
      setOperationAction(ISD::FMAXNUM, VT, Expand);
+    setOperationAction(ISD::FMINNAN, VT, Expand);
+    setOperationAction(ISD::FMAXNAN, VT, Expand);
      setOperationAction(ISD::FMAD, VT, Expand);
      setOperationAction(ISD::SMIN, VT, Expand);
      setOperationAction(ISD::SMAX, VT, Expand);
@@ -828,6 +803,8 @@ void TargetLoweringBase::initActions() {
      setOperationAction(ISD::SMULO, VT, Expand);
      setOperationAction(ISD::UMULO, VT, Expand);
  
+    setOperationAction(ISD::BITREVERSE, VT, Expand);
+    
      // These library functions default to expand.
      setOperationAction(ISD::FROUND, VT, Expand);
  
@@ -838,11 +815,17 @@ void TargetLoweringBase::initActions() {
        setOperationAction(ISD::SIGN_EXTEND_VECTOR_INREG, VT, Expand);
        setOperationAction(ISD::ZERO_EXTEND_VECTOR_INREG, VT, Expand);
      }
+
+    // For most targets @llvm.get.dynamic.area.offest just returns 0.
+    setOperationAction(ISD::GET_DYNAMIC_AREA_OFFSET, VT, Expand);
    }
  
    // Most targets ignore the @llvm.prefetch intrinsic.
    setOperationAction(ISD::PREFETCH, MVT::Other, Expand);
  
+  // Most targets also ignore the @llvm.readcyclecounter intrinsic.
+  setOperationAction(ISD::READCYCLECOUNTER, MVT::i64, Expand);
+
    // ConstantFP nodes default to expand.  Targets can either change this to
    // Legal, in which case all fp constants are legal, or use isFPImmLegal()
    // to optimize expansions for certain constants.
@@ -1111,6 +1094,19 @@ MachineBasicBlock*
  TargetLoweringBase::emitPatchPoint(MachineInstr *MI,
                                     MachineBasicBlock *MBB) const {
    MachineFunction &MF = *MI->getParent()->getParent();
+  MachineFrameInfo &MFI = *MF.getFrameInfo();
+
+  // We're handling multiple types of operands here:
+  // PATCHPOINT MetaArgs - live-in, read only, direct
+  // STATEPOINT Deopt Spill - live-through, read only, indirect
+  // STATEPOINT Deopt Alloca - live-through, read only, direct
+  // (We're currently conservative and mark the deopt slots read/write in
+  // practice.) 
+  // STATEPOINT GC Spill - live-through, read/write, indirect
+  // STATEPOINT GC Alloca - live-through, read/write, direct
+  // The live-in vs live-through is handled already (the live through ones are
+  // all stack slots), but we need to handle the different type of stackmap
+  // operands and memory effects here.
  
    // MI changes inside this loop as we grow operands.
    for(unsigned OperIdx = 0; OperIdx != MI->getNumOperands(); ++OperIdx) {
@@ -1126,10 +1122,24 @@ TargetLoweringBase::emitPatchPoint(MachineInstr *MI,
      // Copy operands before the frame-index.
      for (unsigned i = 0; i < OperIdx; ++i)
        MIB.addOperand(MI->getOperand(i));
-    // Add frame index operands: direct-mem-ref tag, #FI, offset.
-    MIB.addImm(StackMaps::DirectMemRefOp);
-    MIB.addOperand(MI->getOperand(OperIdx));
-    MIB.addImm(0);
+    // Add frame index operands recognized by stackmaps.cpp
+    if (MFI.isStatepointSpillSlotObjectIndex(FI)) {
+      // indirect-mem-ref tag, size, #FI, offset.
+      // Used for spills inserted by StatepointLowering.  This codepath is not
+      // used for patchpoints/stackmaps at all, for these spilling is done via
+      // foldMemoryOperand callback only.
+      assert(MI->getOpcode() == TargetOpcode::STATEPOINT && "sanity");
+      MIB.addImm(StackMaps::IndirectMemRefOp);
+      MIB.addImm(MFI.getObjectSize(FI));
+      MIB.addOperand(MI->getOperand(OperIdx));
+      MIB.addImm(0);
+    } else {
+      // direct-mem-ref tag, #FI, offset.
+      // Used by patchpoint, and direct alloca arguments to statepoints
+      MIB.addImm(StackMaps::DirectMemRefOp);
+      MIB.addOperand(MI->getOperand(OperIdx));
+      MIB.addImm(0);
+    }
      // Copy the operands after the frame index.
      for (unsigned i = OperIdx + 1; i != MI->getNumOperands(); ++i)
        MIB.addOperand(MI->getOperand(i));
@@ -1139,7 +1149,6 @@ TargetLoweringBase::emitPatchPoint(MachineInstr *MI,
      assert(MIB->mayLoad() && "Folded a stackmap use to a non-load!");
  
      // Add a new memory operand for this FI.
-    const MachineFrameInfo &MFI = *MF.getFrameInfo();
      assert(MFI.getObjectOffset(FI) != -1);
  
      unsigned Flags = MachineMemOperand::MOLoad;
@@ -1148,8 +1157,8 @@ TargetLoweringBase::emitPatchPoint(MachineInstr *MI,
        Flags |= MachineMemOperand::MOVolatile;
      }
      MachineMemOperand *MMO = MF.getMachineMemOperand(
-        MachinePointerInfo::getFixedStack(FI), Flags,
-        TM.getDataLayout()->getPointerSize(), MFI.getObjectAlignment(FI));
+        MachinePointerInfo::getFixedStack(MF, FI), Flags,
+        MF.getDataLayout().getPointerSize(), MFI.getObjectAlignment(FI));
      MIB->addMemOperand(MF, MMO);
  
      // Replace the instruction and update the operand index.
@@ -1274,20 +1283,14 @@ void TargetLoweringBase::computeRegisterProperties(
      ValueTypeActions.setTypeAction(MVT::f32, TypeSoftenFloat);
    }
  
+  // Decide how to handle f16. If the target does not have native f16 support,
+  // promote it to f32, because there are no f16 library calls (except for
+  // conversions).
    if (!isTypeLegal(MVT::f16)) {
-    // If the target has native f32 support, promote f16 operations to f32.  If
-    // f32 is not supported, generate soft float library calls.
-    if (isTypeLegal(MVT::f32)) {
-      NumRegistersForVT[MVT::f16] = NumRegistersForVT[MVT::f32];
-      RegisterTypeForVT[MVT::f16] = RegisterTypeForVT[MVT::f32];
-      TransformToType[MVT::f16] = MVT::f32;
-      ValueTypeActions.setTypeAction(MVT::f16, TypePromoteFloat);
-    } else {
-      NumRegistersForVT[MVT::f16] = NumRegistersForVT[MVT::i16];
-      RegisterTypeForVT[MVT::f16] = RegisterTypeForVT[MVT::i16];
-      TransformToType[MVT::f16] = MVT::i16;
-      ValueTypeActions.setTypeAction(MVT::f16, TypeSoftenFloat);
-    }
+    NumRegistersForVT[MVT::f16] = NumRegistersForVT[MVT::f32];
+    RegisterTypeForVT[MVT::f16] = RegisterTypeForVT[MVT::f32];
+    TransformToType[MVT::f16] = MVT::f32;
+    ValueTypeActions.setTypeAction(MVT::f16, TypePromoteFloat);
    }
  
    // Loop over all of the vector value types to see which need transformations.
@@ -1528,6 +1531,29 @@ unsigned TargetLoweringBase::getByValTypeAlignment(Type *Ty,
    return DL.getABITypeAlignment(Ty);
  }
  
+bool TargetLoweringBase::allowsMemoryAccess(LLVMContext &Context,
+                                            const DataLayout &DL, EVT VT,
+                                            unsigned AddrSpace,
+                                            unsigned Alignment,
+                                            bool *Fast) const {
+  // Check if the specified alignment is sufficient based on the data layout.
+  // TODO: While using the data layout works in practice, a better solution
+  // would be to implement this check directly (make this a virtual function).
+  // For example, the ABI alignment may change based on software platform while
+  // this function should only be affected by hardware implementation.
+  Type *Ty = VT.getTypeForEVT(Context);
+  if (Alignment >= DL.getABITypeAlignment(Ty)) {
+    // Assume that an access that meets the ABI-specified alignment is fast.
+    if (Fast != nullptr)
+      *Fast = true;
+    return true;
+  }
+  
+  // This is a misaligned access.
+  return allowsMisalignedMemoryAccesses(VT, AddrSpace, Alignment, Fast);
+}
+
+
  //===----------------------------------------------------------------------===//
  //  TargetTransformInfo Helpers
  //===----------------------------------------------------------------------===//
@@ -1546,6 +1572,11 @@ int TargetLoweringBase::InstructionOpcodeToISD(unsigned Opcode) const {
    case Invoke:         return 0;
    case Resume:         return 0;
    case Unreachable:    return 0;
+  case CleanupRet:     return 0;
+  case CatchRet:       return 0;
+  case CatchPad:       return 0;
+  case CatchSwitch:    return 0;
+  case CleanupPad:     return 0;
    case Add:            return ISD::ADD;
    case FAdd:           return ISD::FADD;
    case Sub:            return ISD::SUB;
@@ -1603,13 +1634,13 @@ int TargetLoweringBase::InstructionOpcodeToISD(unsigned Opcode) const {
    llvm_unreachable("Unknown instruction type encountered!");
  }
  
-std::pair<unsigned, MVT>
+std::pair<int, MVT>
  TargetLoweringBase::getTypeLegalizationCost(const DataLayout &DL,
                                              Type *Ty) const {
    LLVMContext &C = Ty->getContext();
    EVT MTy = getValueType(DL, Ty);
  
-  unsigned Cost = 1;
+  int Cost = 1;
    // We keep legalizing the type until we find a legal kind. We assume that
    // the only operation that costs anything is the split. After splitting
    // we need to handle two types.
@@ -1622,11 +1653,28 @@ TargetLoweringBase::getTypeLegalizationCost(const DataLayout &DL,
      if (LK.first == TypeSplitVector || LK.first == TypeExpandInteger)
        Cost *= 2;
  
+    // Do not loop with f128 type.
+    if (MTy == LK.second)
+      return std::make_pair(Cost, MTy.getSimpleVT());
+
      // Keep legalizing the type.
      MTy = LK.second;
    }
  }
  
+Value *TargetLoweringBase::getSafeStackPointerLocation(IRBuilder<> &IRB) const {
+  if (!TM.getTargetTriple().isAndroid())
+    return nullptr;
+
+  // Android provides a libc function to retrieve the address of the current
+  // thread's unsafe stack pointer.
+  Module *M = IRB.GetInsertBlock()->getParent()->getParent();
+  Type *StackPtrTy = Type::getInt8PtrTy(M->getContext());
+  Value *Fn = M->getOrInsertFunction("__safestack_pointer_address",
+                                     StackPtrTy->getPointerTo(0), nullptr);
+  return IRB.CreateCall(Fn);
+}
+
  //===----------------------------------------------------------------------===//
  //  Loop Strength Reduction hooks
  //===----------------------------------------------------------------------===//