Mutate TargetLowering::shouldExpandAtomicRMWInIR to specifically dictate how AtomicRM...

author JF Bastien <jfb@google.com>

Wed, 4 Mar 2015 15:47:57 +0000 (15:47 +0000)

committer JF Bastien <jfb@google.com>

Wed, 4 Mar 2015 15:47:57 +0000 (15:47 +0000)
author JF Bastien <jfb@google.com>
Wed, 4 Mar 2015 15:47:57 +0000 (15:47 +0000)
committer JF Bastien <jfb@google.com>
Wed, 4 Mar 2015 15:47:57 +0000 (15:47 +0000)
diff --git a/include/llvm/Target/TargetLowering.h b/include/llvm/Target/TargetLowering.h

index 34587cdd8fd60d4746158289d38650fd388ca9e3..a56fdf9f2223aecf8757103897a2435489fd208b 100644 (file)
--- a/include/llvm/Target/TargetLowering.h
+++ b/include/llvm/Target/TargetLowering.h
@@ -123,6 +123,18 @@ public:
                            // mask (ex: x86 blends).
    };
  
+  /// Enum that specifies what a AtomicRMWInst is expanded to, if at all. Exists
+  /// because different targets have different levels of support for these
+  /// atomic RMW instructions, and also have different options w.r.t. what they should
+  /// expand to.
+  enum class AtomicRMWExpansionKind {
+    None,      // Don't expand the instruction.
+    LLSC,      // Expand the instruction into loadlinked/storeconditional; used
+               // by ARM/AArch64. Implies `hasLoadLinkedStoreConditional`
+               // returns true.
+    CmpXChg,   // Expand the instruction into cmpxchg; used by at least X86.
+  };
+
    static ISD::NodeType getExtendForContent(BooleanContent Content) {
      switch (Content) {
      case UndefinedBooleanContent:
@@ -1064,10 +1076,11 @@ public:
    /// (through emitLoadLinked()).
    virtual bool shouldExpandAtomicLoadInIR(LoadInst *LI) const { return false; }
  
-  /// Returns true if the given AtomicRMW should be expanded by the
-  /// IR-level AtomicExpand pass into a loop using LoadLinked/StoreConditional.
-  virtual bool shouldExpandAtomicRMWInIR(AtomicRMWInst *RMWI) const {
-    return false;
+  /// Returns how the IR-level AtomicExpand pass should expand the given
+  /// AtomicRMW, if at all. Default is to never expand.
+  virtual AtomicRMWExpansionKind
+  shouldExpandAtomicRMWInIR(AtomicRMWInst *) const {
+    return AtomicRMWExpansionKind::None;
    }
  
    /// On some platforms, an AtomicRMW that never actually modifies the value
diff --git a/lib/CodeGen/AtomicExpandPass.cpp b/lib/CodeGen/AtomicExpandPass.cpp

index 4b64be053dfd31fa928895369e86ff7dab515cfa..fa17108b2a8eb36fcbe24289154c965b7b308c46 100644 (file)
--- a/lib/CodeGen/AtomicExpandPass.cpp
+++ b/lib/CodeGen/AtomicExpandPass.cpp
@@ -48,7 +48,7 @@ namespace {
      bool expandAtomicLoadToLL(LoadInst *LI);
      bool expandAtomicLoadToCmpXchg(LoadInst *LI);
      bool expandAtomicStore(StoreInst *SI);
-    bool expandAtomicRMW(AtomicRMWInst *AI);
+    bool tryExpandAtomicRMW(AtomicRMWInst *AI);
      bool expandAtomicRMWToLLSC(AtomicRMWInst *AI);
      bool expandAtomicRMWToCmpXchg(AtomicRMWInst *AI);
      bool expandAtomicCmpXchg(AtomicCmpXchgInst *CI);
@@ -135,9 +135,12 @@ bool AtomicExpand::runOnFunction(Function &F) {
        // - into a load if it is idempotent
        // - into a Cmpxchg/LL-SC loop otherwise
        // we try them in that order.
-      MadeChange |=
-          (isIdempotentRMW(RMWI) && simplifyIdempotentRMW(RMWI)) ||
-          (TLI->shouldExpandAtomicRMWInIR(RMWI) && expandAtomicRMW(RMWI));
+
+      if (isIdempotentRMW(RMWI) && simplifyIdempotentRMW(RMWI)) {
+        MadeChange = true;
+      } else {
+        MadeChange |= tryExpandAtomicRMW(RMWI);
+      }
      } else if (CASI && TLI->hasLoadLinkedStoreConditional()) {
        MadeChange |= expandAtomicCmpXchg(CASI);
      }
@@ -211,7 +214,7 @@ bool AtomicExpand::expandAtomicStore(StoreInst *SI) {
    // atomic if implemented as a native store. So we replace them by an
    // atomic swap, that can be implemented for example as a ldrex/strex on ARM
    // or lock cmpxchg8/16b on X86, as these are atomic for larger sizes.
-  // It is the responsibility of the target to only return true in
+  // It is the responsibility of the target to only signal expansion via
    // shouldExpandAtomicRMW in cases where this is required and possible.
    IRBuilder<> Builder(SI);
    AtomicRMWInst *AI =
@@ -220,14 +223,26 @@ bool AtomicExpand::expandAtomicStore(StoreInst *SI) {
    SI->eraseFromParent();
  
    // Now we have an appropriate swap instruction, lower it as usual.
-  return expandAtomicRMW(AI);
+  return tryExpandAtomicRMW(AI);
  }
  
-bool AtomicExpand::expandAtomicRMW(AtomicRMWInst *AI) {
-  if (TLI->hasLoadLinkedStoreConditional())
+bool AtomicExpand::tryExpandAtomicRMW(AtomicRMWInst *AI) {
+  switch (TLI->shouldExpandAtomicRMWInIR(AI)) {
+  case TargetLoweringBase::AtomicRMWExpansionKind::None:
+    return false;
+  case TargetLoweringBase::AtomicRMWExpansionKind::LLSC: {
+    assert(TLI->hasLoadLinkedStoreConditional() &&
+           "TargetLowering requested we expand AtomicRMW instruction into "
+           "load-linked/store-conditional combos, but such instructions aren't "
+           "supported");
+
      return expandAtomicRMWToLLSC(AI);
-  else
+  }
+  case TargetLoweringBase::AtomicRMWExpansionKind::CmpXChg: {
      return expandAtomicRMWToCmpXchg(AI);
+  }
+  }
+  llvm_unreachable("Unhandled case in tryExpandAtomicRMW");
  }
  
  /// Emit IR to implement the given atomicrmw operation on values in registers,
diff --git a/lib/Target/AArch64/AArch64ISelLowering.cpp b/lib/Target/AArch64/AArch64ISelLowering.cpp

index d108c09c1625917775acf83e77645aa6ee910f33..effb0c0d18c6722ef3fd72eed9162cf92c6825f7 100644 (file)
--- a/lib/Target/AArch64/AArch64ISelLowering.cpp
+++ b/lib/Target/AArch64/AArch64ISelLowering.cpp
@@ -8755,9 +8755,11 @@ bool AArch64TargetLowering::shouldExpandAtomicLoadInIR(LoadInst *LI) const {
  }
  
  // For the real atomic operations, we have ldxr/stxr up to 128 bits,
-bool AArch64TargetLowering::shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const {
+TargetLoweringBase::AtomicRMWExpansionKind
+AArch64TargetLowering::shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const {
    unsigned Size = AI->getType()->getPrimitiveSizeInBits();
-  return Size <= 128;
+  return Size <= 128 ? AtomicRMWExpansionKind::LLSC
+                     : AtomicRMWExpansionKind::None;
  }
  
  bool AArch64TargetLowering::hasLoadLinkedStoreConditional() const {
diff --git a/lib/Target/AArch64/AArch64ISelLowering.h b/lib/Target/AArch64/AArch64ISelLowering.h

index 4ad859184402a7adaa99936e1eda57b9d39e7742..e4e3709f354935ae8f99554dac106e0699855cb4 100644 (file)
--- a/lib/Target/AArch64/AArch64ISelLowering.h
+++ b/lib/Target/AArch64/AArch64ISelLowering.h
@@ -335,7 +335,8 @@ public:
  
    bool shouldExpandAtomicLoadInIR(LoadInst *LI) const override;
    bool shouldExpandAtomicStoreInIR(StoreInst *SI) const override;
-  bool shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;
+  TargetLoweringBase::AtomicRMWExpansionKind
+  shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;
  
    bool useLoadStackGuardNode() const override;
    TargetLoweringBase::LegalizeTypeAction
diff --git a/lib/Target/ARM/ARMISelLowering.cpp b/lib/Target/ARM/ARMISelLowering.cpp

index 76b540a0876f1127e7878e3183c9ae9819e1bb7e..7694378b48087049acf2fe830b1ab6d4b494d167 100644 (file)
--- a/lib/Target/ARM/ARMISelLowering.cpp
+++ b/lib/Target/ARM/ARMISelLowering.cpp
@@ -11199,9 +11199,12 @@ bool ARMTargetLowering::shouldExpandAtomicLoadInIR(LoadInst *LI) const {
  
  // For the real atomic operations, we have ldrex/strex up to 32 bits,
  // and up to 64 bits on the non-M profiles
-bool ARMTargetLowering::shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const {
+TargetLoweringBase::AtomicRMWExpansionKind
+ARMTargetLowering::shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const {
    unsigned Size = AI->getType()->getPrimitiveSizeInBits();
-  return Size <= (Subtarget->isMClass() ? 32U : 64U);
+  return (Size <= (Subtarget->isMClass() ? 32U : 64U))
+             ? AtomicRMWExpansionKind::LLSC
+             : AtomicRMWExpansionKind::None;
  }
  
  // This has so far only been implemented for MachO.
diff --git a/lib/Target/ARM/ARMISelLowering.h b/lib/Target/ARM/ARMISelLowering.h

index ec1407d6c42569a204946860d71c76677383fe35..7fd2725b7e56f640445033b15bd810eb68f6e349 100644 (file)
--- a/lib/Target/ARM/ARMISelLowering.h
+++ b/lib/Target/ARM/ARMISelLowering.h
@@ -404,7 +404,8 @@ namespace llvm {
  
      bool shouldExpandAtomicLoadInIR(LoadInst *LI) const override;
      bool shouldExpandAtomicStoreInIR(StoreInst *SI) const override;
-    bool shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;
+    TargetLoweringBase::AtomicRMWExpansionKind
+    shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;
  
      bool useLoadStackGuardNode() const override;
  
diff --git a/lib/Target/X86/X86ISelLowering.cpp b/lib/Target/X86/X86ISelLowering.cpp

index abc05d4e42dc534df1166a4ddc2ea85ec9f53875..e5af7293b0effe568ff87857a878ab213712b4d7 100644 (file)
--- a/lib/Target/X86/X86ISelLowering.cpp
+++ b/lib/Target/X86/X86ISelLowering.cpp
@@ -16398,14 +16398,17 @@ bool X86TargetLowering::shouldExpandAtomicLoadInIR(LoadInst *LI) const {
    return needsCmpXchgNb(PTy->getElementType());
  }
  
-bool X86TargetLowering::shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const {
+TargetLoweringBase::AtomicRMWExpansionKind
+X86TargetLowering::shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const {
    unsigned NativeWidth = Subtarget->is64Bit() ? 64 : 32;
    const Type *MemType = AI->getType();
  
    // If the operand is too big, we must see if cmpxchg8/16b is available
    // and default to library calls otherwise.
-  if (MemType->getPrimitiveSizeInBits() > NativeWidth)
-    return needsCmpXchgNb(MemType);
+  if (MemType->getPrimitiveSizeInBits() > NativeWidth) {
+    return needsCmpXchgNb(MemType) ? AtomicRMWExpansionKind::CmpXChg
+                                   : AtomicRMWExpansionKind::None;
+  }
  
    AtomicRMWInst::BinOp Op = AI->getOperation();
    switch (Op) {
@@ -16415,13 +16418,14 @@ bool X86TargetLowering::shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const {
    case AtomicRMWInst::Add:
    case AtomicRMWInst::Sub:
      // It's better to use xadd, xsub or xchg for these in all cases.
-    return false;
+    return AtomicRMWExpansionKind::None;
    case AtomicRMWInst::Or:
    case AtomicRMWInst::And:
    case AtomicRMWInst::Xor:
      // If the atomicrmw's result isn't actually used, we can just add a "lock"
      // prefix to a normal instruction for these operations.
-    return !AI->use_empty();
+    return !AI->use_empty() ? AtomicRMWExpansionKind::CmpXChg
+                            : AtomicRMWExpansionKind::None;
    case AtomicRMWInst::Nand:
    case AtomicRMWInst::Max:
    case AtomicRMWInst::Min:
@@ -16429,7 +16433,7 @@ bool X86TargetLowering::shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const {
    case AtomicRMWInst::UMin:
      // These always require a non-trivial set of data operations on x86. We must
      // use a cmpxchg loop.
-    return true;
+    return AtomicRMWExpansionKind::CmpXChg;
    }
  }
  
diff --git a/lib/Target/X86/X86ISelLowering.h b/lib/Target/X86/X86ISelLowering.h

index 510520acaf582e90c039730e97794b8f6cbf69cc..f913daabbaea78e483da98c5ef67fd0f8e2020de 100644 (file)
--- a/lib/Target/X86/X86ISelLowering.h
+++ b/lib/Target/X86/X86ISelLowering.h
@@ -991,7 +991,8 @@ namespace llvm {
  
      bool shouldExpandAtomicLoadInIR(LoadInst *SI) const override;
      bool shouldExpandAtomicStoreInIR(StoreInst *SI) const override;
-    bool shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;
+    TargetLoweringBase::AtomicRMWExpansionKind
+    shouldExpandAtomicRMWInIR(AtomicRMWInst *AI) const override;
  
      LoadInst *
      lowerIdempotentRMWIntoFencedLoad(AtomicRMWInst *AI) const override;
author	JF Bastien <jfb@google.com>
	Wed, 4 Mar 2015 15:47:57 +0000 (15:47 +0000)
committer	JF Bastien <jfb@google.com>
	Wed, 4 Mar 2015 15:47:57 +0000 (15:47 +0000)
include/llvm/Target/TargetLowering.h		patch \| blob \| history
lib/CodeGen/AtomicExpandPass.cpp		patch \| blob \| history
lib/Target/AArch64/AArch64ISelLowering.cpp		patch \| blob \| history
lib/Target/AArch64/AArch64ISelLowering.h		patch \| blob \| history
lib/Target/ARM/ARMISelLowering.cpp		patch \| blob \| history
lib/Target/ARM/ARMISelLowering.h		patch \| blob \| history
lib/Target/X86/X86ISelLowering.cpp		patch \| blob \| history
lib/Target/X86/X86ISelLowering.h		patch \| blob \| history