[IndVars] Extract out eliminateIdentitySCEV, NFC

[oota-llvm.git] / lib / CodeGen / CodeGenPrepare.cpp
diff --git a/lib/CodeGen/CodeGenPrepare.cpp b/lib/CodeGen/CodeGenPrepare.cpp

index 6e7f525736d07ad1e61c8c8d3e3e2bbef41e0566..c4c97ff0a3d0425e36e09b24f86e28691ba1d678 100644 (file)
--- a/lib/CodeGen/CodeGenPrepare.cpp
+++ b/lib/CodeGen/CodeGenPrepare.cpp
@@ -114,16 +114,13 @@ typedef DenseMap<Instruction *, TypeIsSExt> InstrToOrigTy;
  class TypePromotionTransaction;
  
    class CodeGenPrepare : public FunctionPass {
-    /// TLI - Keep a pointer of a TargetLowering to consult for determining
-    /// transformation profitability.
      const TargetMachine *TM;
      const TargetLowering *TLI;
      const TargetTransformInfo *TTI;
      const TargetLibraryInfo *TLInfo;
  
-    /// CurInstIterator - As we scan instructions optimizing them, this is the
-    /// next instruction to optimize.  Xforms that can invalidate this should
-    /// update it.
+    /// As we scan instructions optimizing them, this is the next instruction
+    /// to optimize. Transforms that can invalidate this should update it.
      BasicBlock::iterator CurInstIterator;
  
      /// Keeps track of non-local addresses that have been sunk into a block.
@@ -137,10 +134,10 @@ class TypePromotionTransaction;
      /// promotion for the current function.
      InstrToOrigTy PromotedInsts;
  
-    /// ModifiedDT - If CFG is modified in anyway.
+    /// True if CFG is modified in any way.
      bool ModifiedDT;
  
-    /// OptSize - True if optimizing for size.
+    /// True if optimizing for size.
      bool OptSize;
  
      /// DataLayout for the Function being processed.
@@ -163,30 +160,31 @@ class TypePromotionTransaction;
      }
  
    private:
-    bool EliminateFallThrough(Function &F);
-    bool EliminateMostlyEmptyBlocks(Function &F);
-    bool CanMergeBlocks(const BasicBlock *BB, const BasicBlock *DestBB) const;
-    void EliminateMostlyEmptyBlock(BasicBlock *BB);
-    bool OptimizeBlock(BasicBlock &BB, bool& ModifiedDT);
-    bool OptimizeInst(Instruction *I, bool& ModifiedDT);
-    bool OptimizeMemoryInst(Instruction *I, Value *Addr,
+    bool eliminateFallThrough(Function &F);
+    bool eliminateMostlyEmptyBlocks(Function &F);
+    bool canMergeBlocks(const BasicBlock *BB, const BasicBlock *DestBB) const;
+    void eliminateMostlyEmptyBlock(BasicBlock *BB);
+    bool optimizeBlock(BasicBlock &BB, bool& ModifiedDT);
+    bool optimizeInst(Instruction *I, bool& ModifiedDT);
+    bool optimizeMemoryInst(Instruction *I, Value *Addr,
                              Type *AccessTy, unsigned AS);
-    bool OptimizeInlineAsmInst(CallInst *CS);
-    bool OptimizeCallInst(CallInst *CI, bool& ModifiedDT);
-    bool MoveExtToFormExtLoad(Instruction *&I);
-    bool OptimizeExtUses(Instruction *I);
-    bool OptimizeSelectInst(SelectInst *SI);
-    bool OptimizeShuffleVectorInst(ShuffleVectorInst *SI);
-    bool OptimizeExtractElementInst(Instruction *Inst);
-    bool DupRetToEnableTailCallOpts(BasicBlock *BB);
-    bool PlaceDbgValues(Function &F);
+    bool optimizeInlineAsmInst(CallInst *CS);
+    bool optimizeCallInst(CallInst *CI, bool& ModifiedDT);
+    bool moveExtToFormExtLoad(Instruction *&I);
+    bool optimizeExtUses(Instruction *I);
+    bool optimizeSelectInst(SelectInst *SI);
+    bool optimizeShuffleVectorInst(ShuffleVectorInst *SI);
+    bool optimizeExtractElementInst(Instruction *Inst);
+    bool dupRetToEnableTailCallOpts(BasicBlock *BB);
+    bool placeDbgValues(Function &F);
      bool sinkAndCmp(Function &F);
-    bool ExtLdPromotion(TypePromotionTransaction &TPT, LoadInst *&LI,
+    bool extLdPromotion(TypePromotionTransaction &TPT, LoadInst *&LI,
                          Instruction *&Inst,
                          const SmallVectorImpl<Instruction *> &Exts,
                          unsigned CreatedInstCost);
      bool splitBranchCondition(Function &F);
      bool simplifyOffsetableRelocate(Instruction &I);
+    void stripInvariantGroupMetadata(Instruction &I);
    };
  }
  
@@ -214,8 +212,7 @@ bool CodeGenPrepare::runOnFunction(Function &F) {
      TLI = TM->getSubtargetImpl(F)->getTargetLowering();
    TLInfo = &getAnalysis<TargetLibraryInfoWrapperPass>().getTLI();
    TTI = &getAnalysis<TargetTransformInfoWrapperPass>().getTTI(F);
-  // FIXME: Use Function::optForSize().
-  OptSize = F.hasFnAttribute(Attribute::OptimizeForSize);
+  OptSize = F.optForSize();
  
    /// This optimization identifies DIV instructions that can be
    /// profitably bypassed and carried out with a shorter, faster divide.
@@ -228,12 +225,12 @@ bool CodeGenPrepare::runOnFunction(Function &F) {
  
    // Eliminate blocks that contain only PHI nodes and an
    // unconditional branch.
-  EverMadeChange |= EliminateMostlyEmptyBlocks(F);
+  EverMadeChange |= eliminateMostlyEmptyBlocks(F);
  
    // llvm.dbg.value is far away from the value then iSel may not be able
    // handle it properly. iSel will drop llvm.dbg.value if it can not
    // find a node corresponding to the value.
-  EverMadeChange |= PlaceDbgValues(F);
+  EverMadeChange |= placeDbgValues(F);
  
    // If there is a mask, compare against zero, and branch that can be combined
    // into a single target instruction, push the mask and compare into branch
@@ -250,7 +247,7 @@ bool CodeGenPrepare::runOnFunction(Function &F) {
      for (Function::iterator I = F.begin(); I != F.end(); ) {
        BasicBlock *BB = I++;
        bool ModifiedDTOnIteration = false;
-      MadeChange |= OptimizeBlock(*BB, ModifiedDTOnIteration);
+      MadeChange |= optimizeBlock(*BB, ModifiedDTOnIteration);
  
        // Restart BB iteration if the dominator tree of the Function was changed
        if (ModifiedDTOnIteration)
@@ -293,7 +290,7 @@ bool CodeGenPrepare::runOnFunction(Function &F) {
      // Merge pairs of basic blocks with unconditional branches, connected by
      // a single edge.
      if (EverMadeChange || MadeChange)
-      MadeChange |= EliminateFallThrough(F);
+      MadeChange |= eliminateFallThrough(F);
  
      EverMadeChange |= MadeChange;
    }
@@ -311,10 +308,10 @@ bool CodeGenPrepare::runOnFunction(Function &F) {
    return EverMadeChange;
  }
  
-/// EliminateFallThrough - Merge basic blocks which are connected
-/// by a single edge, where one of the basic blocks has a single successor
-/// pointing to the other basic block, which has a single predecessor.
-bool CodeGenPrepare::EliminateFallThrough(Function &F) {
+/// Merge basic blocks which are connected by a single edge, where one of the
+/// basic blocks has a single successor pointing to the other basic block,
+/// which has a single predecessor.
+bool CodeGenPrepare::eliminateFallThrough(Function &F) {
    bool Changed = false;
    // Scan all of the blocks in the function, except for the entry block.
    for (Function::iterator I = std::next(F.begin()), E = F.end(); I != E;) {
@@ -345,12 +342,11 @@ bool CodeGenPrepare::EliminateFallThrough(Function &F) {
    return Changed;
  }
  
-/// EliminateMostlyEmptyBlocks - eliminate blocks that contain only PHI nodes,
-/// debug info directives, and an unconditional branch.  Passes before isel
-/// (e.g. LSR/loopsimplify) often split edges in ways that are non-optimal for
-/// isel.  Start by eliminating these blocks so we can split them the way we
-/// want them.
-bool CodeGenPrepare::EliminateMostlyEmptyBlocks(Function &F) {
+/// Eliminate blocks that contain only PHI nodes, debug info directives, and an
+/// unconditional branch. Passes before isel (e.g. LSR/loopsimplify) often split
+/// edges in ways that are non-optimal for isel. Start by eliminating these
+/// blocks so we can split them the way we want them.
+bool CodeGenPrepare::eliminateMostlyEmptyBlocks(Function &F) {
    bool MadeChange = false;
    // Note that this intentionally skips the entry block.
    for (Function::iterator I = std::next(F.begin()), E = F.end(); I != E;) {
@@ -380,19 +376,19 @@ bool CodeGenPrepare::EliminateMostlyEmptyBlocks(Function &F) {
      if (DestBB == BB)
        continue;
  
-    if (!CanMergeBlocks(BB, DestBB))
+    if (!canMergeBlocks(BB, DestBB))
        continue;
  
-    EliminateMostlyEmptyBlock(BB);
+    eliminateMostlyEmptyBlock(BB);
      MadeChange = true;
    }
    return MadeChange;
  }
  
-/// CanMergeBlocks - Return true if we can merge BB into DestBB if there is a
-/// single uncond branch between them, and BB contains no other non-phi
+/// Return true if we can merge BB into DestBB if there is a single
+/// unconditional branch between them, and BB contains no other non-phi
  /// instructions.
-bool CodeGenPrepare::CanMergeBlocks(const BasicBlock *BB,
+bool CodeGenPrepare::canMergeBlocks(const BasicBlock *BB,
                                      const BasicBlock *DestBB) const {
    // We only want to eliminate blocks whose phi nodes are used by phi nodes in
    // the successor.  If there are more complex condition (e.g. preheaders),
@@ -458,9 +454,9 @@ bool CodeGenPrepare::CanMergeBlocks(const BasicBlock *BB,
  }
  
  
-/// EliminateMostlyEmptyBlock - Eliminate a basic block that have only phi's and
-/// an unconditional branch in it.
-void CodeGenPrepare::EliminateMostlyEmptyBlock(BasicBlock *BB) {
+/// Eliminate a basic block that has only phi's and an unconditional branch in
+/// it.
+void CodeGenPrepare::eliminateMostlyEmptyBlock(BasicBlock *BB) {
    BranchInst *BI = cast<BranchInst>(BB->getTerminator());
    BasicBlock *DestBB = BI->getSuccessor(0);
  
@@ -748,10 +744,9 @@ static bool SinkCast(CastInst *CI) {
    return MadeChange;
  }
  
-/// OptimizeNoopCopyExpression - If the specified cast instruction is a noop
-/// copy (e.g. it's casting from one pointer type to another, i32->i8 on PPC),
-/// sink it into user blocks to reduce the number of virtual
-/// registers that must be created and coalesced.
+/// If the specified cast instruction is a noop copy (e.g. it's casting from
+/// one pointer type to another, i32->i8 on PPC), sink it into user blocks to
+/// reduce the number of virtual registers that must be created and coalesced.
  ///
  /// Return true if any changes are made.
  ///
@@ -786,8 +781,8 @@ static bool OptimizeNoopCopyExpression(CastInst *CI, const TargetLowering &TLI,
    return SinkCast(CI);
  }
  
-/// CombineUAddWithOverflow - try to combine CI into a call to the
-/// llvm.uadd.with.overflow intrinsic if possible.
+/// Try to combine CI into a call to the llvm.uadd.with.overflow intrinsic if
+/// possible.
  ///
  /// Return true if any changes were made.
  static bool CombineUAddWithOverflow(CmpInst *CI) {
@@ -833,16 +828,16 @@ static bool CombineUAddWithOverflow(CmpInst *CI) {
    return true;
  }
  
-/// SinkCmpExpression - Sink the given CmpInst into user blocks to reduce
-/// the number of virtual registers that must be created and coalesced.  This is
-/// a clear win except on targets with multiple condition code registers
-///  (PowerPC), where it might lose; some adjustment may be wanted there.
+/// Sink the given CmpInst into user blocks to reduce the number of virtual
+/// registers that must be created and coalesced. This is a clear win except on
+/// targets with multiple condition code registers (PowerPC), where it might
+/// lose; some adjustment may be wanted there.
  ///
  /// Return true if any changes are made.
  static bool SinkCmpExpression(CmpInst *CI) {
    BasicBlock *DefBB = CI->getParent();
  
-  /// InsertedCmp - Only insert a cmp in each block once.
+  /// Only insert a cmp in each block once.
    DenseMap<BasicBlock*, CmpInst*> InsertedCmps;
  
    bool MadeChange = false;
@@ -900,8 +895,8 @@ static bool OptimizeCmpExpression(CmpInst *CI) {
    return false;
  }
  
-/// isExtractBitsCandidateUse - Check if the candidates could
-/// be combined with shift instruction, which includes:
+/// Check if the candidates could be combined with a shift instruction, which
+/// includes:
  /// 1. Truncate instruction
  /// 2. And instruction and the imm is a mask of the low bits:
  /// imm & (imm+1) == 0
@@ -919,8 +914,7 @@ static bool isExtractBitsCandidateUse(Instruction *User) {
    return true;
  }
  
-/// SinkShiftAndTruncate - sink both shift and truncate instruction
-/// to the use of truncate's BB.
+/// Sink both shift and truncate instruction to the use of truncate's BB.
  static bool
  SinkShiftAndTruncate(BinaryOperator *ShiftI, Instruction *User, ConstantInt *CI,
                       DenseMap<BasicBlock *, BinaryOperator *> &InsertedShifts,
@@ -990,10 +984,10 @@ SinkShiftAndTruncate(BinaryOperator *ShiftI, Instruction *User, ConstantInt *CI,
    return MadeChange;
  }
  
-/// OptimizeExtractBits - sink the shift *right* instruction into user blocks if
-/// the uses could potentially be combined with this shift instruction and
-/// generate BitExtract instruction. It will only be applied if the architecture
-/// supports BitExtract instruction. Here is an example:
+/// Sink the shift *right* instruction into user blocks if the uses could
+/// potentially be combined with this shift instruction and generate BitExtract
+/// instruction. It will only be applied if the architecture supports BitExtract
+/// instruction. Here is an example:
  /// BB1:
  ///   %x.extract.shift = lshr i64 %arg1, 32
  /// BB2:
@@ -1086,10 +1080,10 @@ static bool OptimizeExtractBits(BinaryOperator *ShiftI, ConstantInt *CI,
    return MadeChange;
  }
  
-//  ScalarizeMaskedLoad() translates masked load intrinsic, like 
+// Translate a masked load intrinsic like
  // <16 x i32 > @llvm.masked.load( <16 x i32>* %addr, i32 align,
  //                               <16 x i1> %mask, <16 x i32> %passthru)
-// to a chain of basic blocks, whith loading element one-by-one if
+// to a chain of basic blocks, with loading element one-by-one if
  // the appropriate mask bit is set
  // 
  //  %1 = bitcast i8* %addr to i32*
@@ -1205,7 +1199,7 @@ static void ScalarizeMaskedLoad(CallInst *CI) {
    CI->eraseFromParent();
  }
  
-//  ScalarizeMaskedStore() translates masked store intrinsic, like
+// Translate a masked store intrinsic, like
  // void @llvm.masked.store(<16 x i32> %src, <16 x i32>* %addr, i32 align,
  //                               <16 x i1> %mask)
  // to a chain of basic blocks, that stores element one-by-one if
@@ -1292,7 +1286,7 @@ static void ScalarizeMaskedStore(CallInst *CI) {
    CI->eraseFromParent();
  }
  
-bool CodeGenPrepare::OptimizeCallInst(CallInst *CI, bool& ModifiedDT) {
+bool CodeGenPrepare::optimizeCallInst(CallInst *CI, bool& ModifiedDT) {
    BasicBlock *BB = CI->getParent();
  
    // Lower inline assembly if we can.
@@ -1308,7 +1302,7 @@ bool CodeGenPrepare::OptimizeCallInst(CallInst *CI, bool& ModifiedDT) {
        return true;
      }
      // Sink address computing for memory operands into the block.
-    if (OptimizeInlineAsmInst(CI))
+    if (optimizeInlineAsmInst(CI))
        return true;
    }
  
@@ -1412,6 +1406,10 @@ bool CodeGenPrepare::OptimizeCallInst(CallInst *CI, bool& ModifiedDT) {
        InsertedInsts.insert(ExtVal);
        return true;
      }
+    case Intrinsic::invariant_group_barrier:
+      II->replaceAllUsesWith(II->getArgOperand(0));
+      II->eraseFromParent();
+      return true;
      }
  
      if (TLI) {
@@ -1423,7 +1421,7 @@ bool CodeGenPrepare::OptimizeCallInst(CallInst *CI, bool& ModifiedDT) {
        Type *AccessTy;
        if (TLI->GetAddrModeArguments(II, PtrOps, AccessTy, AddrSpace))
          while (!PtrOps.empty())
-          if (OptimizeMemoryInst(II, PtrOps.pop_back_val(), AccessTy, AddrSpace))
+          if (optimizeMemoryInst(II, PtrOps.pop_back_val(), AccessTy, AddrSpace))
              return true;
      }
    }
@@ -1444,9 +1442,8 @@ bool CodeGenPrepare::OptimizeCallInst(CallInst *CI, bool& ModifiedDT) {
    return false;
  }
  
-/// DupRetToEnableTailCallOpts - Look for opportunities to duplicate return
-/// instructions to the predecessor to enable tail call optimizations. The
-/// case it is currently looking for is:
+/// Look for opportunities to duplicate return instructions to the predecessor
+/// to enable tail call optimizations. The case it is currently looking for is:
  /// @code
  /// bb0:
  ///   %tmp0 = tail call i32 @f0()
@@ -1475,7 +1472,7 @@ bool CodeGenPrepare::OptimizeCallInst(CallInst *CI, bool& ModifiedDT) {
  ///   %tmp2 = tail call i32 @f2()
  ///   ret i32 %tmp2
  /// @endcode
-bool CodeGenPrepare::DupRetToEnableTailCallOpts(BasicBlock *BB) {
+bool CodeGenPrepare::dupRetToEnableTailCallOpts(BasicBlock *BB) {
    if (!TLI)
      return false;
  
@@ -1594,7 +1591,7 @@ bool CodeGenPrepare::DupRetToEnableTailCallOpts(BasicBlock *BB) {
  
  namespace {
  
-/// ExtAddrMode - This is an extended version of TargetLowering::AddrMode
+/// This is an extended version of TargetLowering::AddrMode
  /// which holds actual Value*'s for register values.
  struct ExtAddrMode : public TargetLowering::AddrMode {
    Value *BaseReg;
@@ -2108,7 +2105,7 @@ class AddressingModeMatcher {
    unsigned AddrSpace;
    Instruction *MemoryInst;
  
-  /// AddrMode - This is the addressing mode that we're building up.  This is
+  /// This is the addressing mode that we're building up. This is
    /// part of the return value of this addressing mode matching stuff.
    ExtAddrMode &AddrMode;
  
@@ -2119,9 +2116,8 @@ class AddressingModeMatcher {
    /// The ongoing transaction where every action should be registered.
    TypePromotionTransaction &TPT;
  
-  /// IgnoreProfitability - This is set to true when we should not do
-  /// profitability checks.  When true, IsProfitableToFoldIntoAddressingMode
-  /// always returns true.
+  /// This is set to true when we should not do profitability checks.
+  /// When true, IsProfitableToFoldIntoAddressingMode always returns true.
    bool IgnoreProfitability;
  
    AddressingModeMatcher(SmallVectorImpl<Instruction *> &AMI,
@@ -2140,7 +2136,7 @@ class AddressingModeMatcher {
    }
  public:
  
-  /// Match - Find the maximal addressing mode that a load/store of V can fold,
+  /// Find the maximal addressing mode that a load/store of V can fold,
    /// give an access type of AccessTy.  This returns a list of involved
    /// instructions in AddrModeInsts.
    /// \p InsertedInsts The instructions inserted by other CodeGenPrepare
@@ -2158,32 +2154,32 @@ public:
  
      bool Success = AddressingModeMatcher(AddrModeInsts, TM, AccessTy, AS,
                                           MemoryInst, Result, InsertedInsts,
-                                         PromotedInsts, TPT).MatchAddr(V, 0);
+                                         PromotedInsts, TPT).matchAddr(V, 0);
      (void)Success; assert(Success && "Couldn't select *anything*?");
      return Result;
    }
  private:
-  bool MatchScaledValue(Value *ScaleReg, int64_t Scale, unsigned Depth);
-  bool MatchAddr(Value *V, unsigned Depth);
-  bool MatchOperationAddr(User *Operation, unsigned Opcode, unsigned Depth,
+  bool matchScaledValue(Value *ScaleReg, int64_t Scale, unsigned Depth);
+  bool matchAddr(Value *V, unsigned Depth);
+  bool matchOperationAddr(User *Operation, unsigned Opcode, unsigned Depth,
                            bool *MovedAway = nullptr);
-  bool IsProfitableToFoldIntoAddressingMode(Instruction *I,
+  bool isProfitableToFoldIntoAddressingMode(Instruction *I,
                                              ExtAddrMode &AMBefore,
                                              ExtAddrMode &AMAfter);
-  bool ValueAlreadyLiveAtInst(Value *Val, Value *KnownLive1, Value *KnownLive2);
-  bool IsPromotionProfitable(unsigned NewCost, unsigned OldCost,
+  bool valueAlreadyLiveAtInst(Value *Val, Value *KnownLive1, Value *KnownLive2);
+  bool isPromotionProfitable(unsigned NewCost, unsigned OldCost,
                               Value *PromotedOperand) const;
  };
  
-/// MatchScaledValue - Try adding ScaleReg*Scale to the current addressing mode.
+/// Try adding ScaleReg*Scale to the current addressing mode.
  /// Return true and update AddrMode if this addr mode is legal for the target,
  /// false if not.
-bool AddressingModeMatcher::MatchScaledValue(Value *ScaleReg, int64_t Scale,
+bool AddressingModeMatcher::matchScaledValue(Value *ScaleReg, int64_t Scale,
                                               unsigned Depth) {
    // If Scale is 1, then this is the same as adding ScaleReg to the addressing
    // mode.  Just process that directly.
    if (Scale == 1)
-    return MatchAddr(ScaleReg, Depth);
+    return matchAddr(ScaleReg, Depth);
  
    // If the scale is 0, it takes nothing to add this.
    if (Scale == 0)
@@ -2230,9 +2226,9 @@ bool AddressingModeMatcher::MatchScaledValue(Value *ScaleReg, int64_t Scale,
    return true;
  }
  
-/// MightBeFoldableInst - This is a little filter, which returns true if an
-/// addressing computation involving I might be folded into a load/store
-/// accessing it.  This doesn't need to be perfect, but needs to accept at least
+/// This is a little filter, which returns true if an addressing computation
+/// involving I might be folded into a load/store accessing it.
+/// This doesn't need to be perfect, but needs to accept at least
  /// the set of instructions that MatchOperationAddr can.
  static bool MightBeFoldableInst(Instruction *I) {
    switch (I->getOpcode()) {
@@ -2628,8 +2624,7 @@ Value *TypePromotionHelper::promoteOperandForOther(
    return ExtOpnd;
  }
  
-/// IsPromotionProfitable - Check whether or not promoting an instruction
-/// to a wider type was profitable.
+/// Check whether or not promoting an instruction to a wider type is profitable.
  /// \p NewCost gives the cost of extension instructions created by the
  /// promotion.
  /// \p OldCost gives the cost of extension instructions before the promotion
@@ -2637,7 +2632,7 @@ Value *TypePromotionHelper::promoteOperandForOther(
  /// matched in the addressing mode the promotion.
  /// \p PromotedOperand is the value that has been promoted.
  /// \return True if the promotion is profitable, false otherwise.
-bool AddressingModeMatcher::IsPromotionProfitable(
+bool AddressingModeMatcher::isPromotionProfitable(
      unsigned NewCost, unsigned OldCost, Value *PromotedOperand) const {
    DEBUG(dbgs() << "OldCost: " << OldCost << "\tNewCost: " << NewCost << '\n');
    // The cost of the new extensions is greater than the cost of the
@@ -2653,9 +2648,9 @@ bool AddressingModeMatcher::IsPromotionProfitable(
    return isPromotedInstructionLegal(TLI, DL, PromotedOperand);
  }
  
-/// MatchOperationAddr - Given an instruction or constant expr, see if we can
-/// fold the operation into the addressing mode.  If so, update the addressing
-/// mode and return true, otherwise return false without modifying AddrMode.
+/// Given an instruction or constant expr, see if we can fold the operation
+/// into the addressing mode. If so, update the addressing  mode and return
+/// true, otherwise return false without modifying AddrMode.
  /// If \p MovedAway is not NULL, it contains the information of whether or
  /// not AddrInst has to be folded into the addressing mode on success.
  /// If \p MovedAway == true, \p AddrInst will not be part of the addressing
@@ -2664,7 +2659,7 @@ bool AddressingModeMatcher::IsPromotionProfitable(
  /// This state can happen when AddrInst is a sext, since it may be moved away.
  /// Therefore, AddrInst may not be valid when MovedAway is true and it must
  /// not be referenced anymore.
-bool AddressingModeMatcher::MatchOperationAddr(User *AddrInst, unsigned Opcode,
+bool AddressingModeMatcher::matchOperationAddr(User *AddrInst, unsigned Opcode,
                                                 unsigned Depth,
                                                 bool *MovedAway) {
    // Avoid exponential behavior on extremely deep expression trees.
@@ -2677,13 +2672,13 @@ bool AddressingModeMatcher::MatchOperationAddr(User *AddrInst, unsigned Opcode,
    switch (Opcode) {
    case Instruction::PtrToInt:
      // PtrToInt is always a noop, as we know that the int type is pointer sized.
-    return MatchAddr(AddrInst->getOperand(0), Depth);
+    return matchAddr(AddrInst->getOperand(0), Depth);
    case Instruction::IntToPtr: {
      auto AS = AddrInst->getType()->getPointerAddressSpace();
      auto PtrTy = MVT::getIntegerVT(DL.getPointerSizeInBits(AS));
      // This inttoptr is a no-op if the integer type is pointer sized.
      if (TLI.getValueType(DL, AddrInst->getOperand(0)->getType()) == PtrTy)
-      return MatchAddr(AddrInst->getOperand(0), Depth);
+      return matchAddr(AddrInst->getOperand(0), Depth);
      return false;
    }
    case Instruction::BitCast:
@@ -2695,14 +2690,14 @@ bool AddressingModeMatcher::MatchOperationAddr(User *AddrInst, unsigned Opcode,
          // and we don't want to mess around with them.  Assume it knows what it
          // is doing.
          AddrInst->getOperand(0)->getType() != AddrInst->getType())
-      return MatchAddr(AddrInst->getOperand(0), Depth);
+      return matchAddr(AddrInst->getOperand(0), Depth);
      return false;
    case Instruction::AddrSpaceCast: {
      unsigned SrcAS
        = AddrInst->getOperand(0)->getType()->getPointerAddressSpace();
      unsigned DestAS = AddrInst->getType()->getPointerAddressSpace();
      if (TLI.isNoopAddrSpaceCast(SrcAS, DestAS))
-      return MatchAddr(AddrInst->getOperand(0), Depth);
+      return matchAddr(AddrInst->getOperand(0), Depth);
      return false;
    }
    case Instruction::Add: {
@@ -2716,8 +2711,8 @@ bool AddressingModeMatcher::MatchOperationAddr(User *AddrInst, unsigned Opcode,
      TypePromotionTransaction::ConstRestorationPt LastKnownGood =
          TPT.getRestorationPoint();
  
-    if (MatchAddr(AddrInst->getOperand(1), Depth+1) &&
-        MatchAddr(AddrInst->getOperand(0), Depth+1))
+    if (matchAddr(AddrInst->getOperand(1), Depth+1) &&
+        matchAddr(AddrInst->getOperand(0), Depth+1))
        return true;
  
      // Restore the old addr mode info.
@@ -2726,8 +2721,8 @@ bool AddressingModeMatcher::MatchOperationAddr(User *AddrInst, unsigned Opcode,
      TPT.rollback(LastKnownGood);
  
      // Otherwise this was over-aggressive.  Try merging in the LHS then the RHS.
-    if (MatchAddr(AddrInst->getOperand(0), Depth+1) &&
-        MatchAddr(AddrInst->getOperand(1), Depth+1))
+    if (matchAddr(AddrInst->getOperand(0), Depth+1) &&
+        matchAddr(AddrInst->getOperand(1), Depth+1))
        return true;
  
      // Otherwise we definitely can't merge the ADD in.
@@ -2749,7 +2744,7 @@ bool AddressingModeMatcher::MatchOperationAddr(User *AddrInst, unsigned Opcode,
      if (Opcode == Instruction::Shl)
        Scale = 1LL << Scale;
  
-    return MatchScaledValue(AddrInst->getOperand(0), Scale, Depth);
+    return matchScaledValue(AddrInst->getOperand(0), Scale, Depth);
    }
    case Instruction::GetElementPtr: {
      // Scan the GEP.  We check it if it contains constant offsets and at most
@@ -2788,7 +2783,7 @@ bool AddressingModeMatcher::MatchOperationAddr(User *AddrInst, unsigned Opcode,
        if (ConstantOffset == 0 ||
            TLI.isLegalAddressingMode(DL, AddrMode, AccessTy, AddrSpace)) {
          // Check to see if we can fold the base pointer in too.
-        if (MatchAddr(AddrInst->getOperand(0), Depth+1))
+        if (matchAddr(AddrInst->getOperand(0), Depth+1))
            return true;
        }
        AddrMode.BaseOffs -= ConstantOffset;
@@ -2803,7 +2798,7 @@ bool AddressingModeMatcher::MatchOperationAddr(User *AddrInst, unsigned Opcode,
      AddrMode.BaseOffs += ConstantOffset;
  
      // Match the base operand of the GEP.
-    if (!MatchAddr(AddrInst->getOperand(0), Depth+1)) {
+    if (!matchAddr(AddrInst->getOperand(0), Depth+1)) {
        // If it couldn't be matched, just stuff the value in a register.
        if (AddrMode.HasBaseReg) {
          AddrMode = BackupAddrMode;
@@ -2815,7 +2810,7 @@ bool AddressingModeMatcher::MatchOperationAddr(User *AddrInst, unsigned Opcode,
      }
  
      // Match the remaining variable portion of the GEP.
-    if (!MatchScaledValue(AddrInst->getOperand(VariableOperand), VariableScale,
+    if (!matchScaledValue(AddrInst->getOperand(VariableOperand), VariableScale,
                            Depth)) {
        // If it couldn't be matched, try stuffing the base into a register
        // instead of matching it, and retrying the match of the scale.
@@ -2826,7 +2821,7 @@ bool AddressingModeMatcher::MatchOperationAddr(User *AddrInst, unsigned Opcode,
        AddrMode.HasBaseReg = true;
        AddrMode.BaseReg = AddrInst->getOperand(0);
        AddrMode.BaseOffs += ConstantOffset;
-      if (!MatchScaledValue(AddrInst->getOperand(VariableOperand),
+      if (!matchScaledValue(AddrInst->getOperand(VariableOperand),
                              VariableScale, Depth)) {
          // If even that didn't work, bail.
          AddrMode = BackupAddrMode;
@@ -2876,12 +2871,12 @@ bool AddressingModeMatcher::MatchOperationAddr(User *AddrInst, unsigned Opcode,
      ExtAddrMode BackupAddrMode = AddrMode;
      unsigned OldSize = AddrModeInsts.size();
  
-    if (!MatchAddr(PromotedOperand, Depth) ||
+    if (!matchAddr(PromotedOperand, Depth) ||
          // The total of the new cost is equals to the cost of the created
          // instructions.
          // The total of the old cost is equals to the cost of the extension plus
          // what we have saved in the addressing mode.
-        !IsPromotionProfitable(CreatedInstsCost,
+        !isPromotionProfitable(CreatedInstsCost,
                                 ExtCost + (AddrModeInsts.size() - OldSize),
                                 PromotedOperand)) {
        AddrMode = BackupAddrMode;
@@ -2896,12 +2891,12 @@ bool AddressingModeMatcher::MatchOperationAddr(User *AddrInst, unsigned Opcode,
    return false;
  }
  
-/// MatchAddr - If we can, try to add the value of 'Addr' into the current
-/// addressing mode.  If Addr can't be added to AddrMode this returns false and
-/// leaves AddrMode unmodified.  This assumes that Addr is either a pointer type
-/// or intptr_t for the target.
+/// If we can, try to add the value of 'Addr' into the current addressing mode.
+/// If Addr can't be added to AddrMode this returns false and leaves AddrMode
+/// unmodified. This assumes that Addr is either a pointer type or intptr_t
+/// for the target.
  ///
-bool AddressingModeMatcher::MatchAddr(Value *Addr, unsigned Depth) {
+bool AddressingModeMatcher::matchAddr(Value *Addr, unsigned Depth) {
    // Start a transaction at this point that we will rollback if the matching
    // fails.
    TypePromotionTransaction::ConstRestorationPt LastKnownGood =
@@ -2926,7 +2921,7 @@ bool AddressingModeMatcher::MatchAddr(Value *Addr, unsigned Depth) {
  
      // Check to see if it is possible to fold this operation.
      bool MovedAway = false;
-    if (MatchOperationAddr(I, I->getOpcode(), Depth, &MovedAway)) {
+    if (matchOperationAddr(I, I->getOpcode(), Depth, &MovedAway)) {
        // This instruction may have been move away. If so, there is nothing
        // to check here.
        if (MovedAway)
@@ -2935,7 +2930,7 @@ bool AddressingModeMatcher::MatchAddr(Value *Addr, unsigned Depth) {
        // *profitable* to do so.  We use a simple cost model to avoid increasing
        // register pressure too much.
        if (I->hasOneUse() ||
-          IsProfitableToFoldIntoAddressingMode(I, BackupAddrMode, AddrMode)) {
+          isProfitableToFoldIntoAddressingMode(I, BackupAddrMode, AddrMode)) {
          AddrModeInsts.push_back(I);
          return true;
        }
@@ -2947,7 +2942,7 @@ bool AddressingModeMatcher::MatchAddr(Value *Addr, unsigned Depth) {
        TPT.rollback(LastKnownGood);
      }
    } else if (ConstantExpr *CE = dyn_cast<ConstantExpr>(Addr)) {
-    if (MatchOperationAddr(CE, CE->getOpcode(), Depth))
+    if (matchOperationAddr(CE, CE->getOpcode(), Depth))
        return true;
      TPT.rollback(LastKnownGood);
    } else if (isa<ConstantPointerNull>(Addr)) {
@@ -2980,9 +2975,8 @@ bool AddressingModeMatcher::MatchAddr(Value *Addr, unsigned Depth) {
    return false;
  }
  
-/// IsOperandAMemoryOperand - Check to see if all uses of OpVal by the specified
-/// inline asm call are due to memory operands.  If so, return true, otherwise
-/// return false.
+/// Check to see if all uses of OpVal by the specified inline asm call are due
+/// to memory operands. If so, return true, otherwise return false.
  static bool IsOperandAMemoryOperand(CallInst *CI, InlineAsm *IA, Value *OpVal,
                                      const TargetMachine &TM) {
    const Function *F = CI->getParent()->getParent();
@@ -3008,8 +3002,8 @@ static bool IsOperandAMemoryOperand(CallInst *CI, InlineAsm *IA, Value *OpVal,
    return true;
  }
  
-/// FindAllMemoryUses - Recursively walk all the uses of I until we find a
-/// memory use.  If we find an obviously non-foldable instruction, return true.
+/// Recursively walk all the uses of I until we find a memory use.
+/// If we find an obviously non-foldable instruction, return true.
  /// Add the ultimately found memory instructions to MemoryUses.
  static bool FindAllMemoryUses(
      Instruction *I,
@@ -3060,7 +3054,7 @@ static bool FindAllMemoryUses(
  /// the use site that we're folding it into.  If so, there is no cost to
  /// include it in the addressing mode.  KnownLive1 and KnownLive2 are two values
  /// that we know are live at the instruction already.
-bool AddressingModeMatcher::ValueAlreadyLiveAtInst(Value *Val,Value *KnownLive1,
+bool AddressingModeMatcher::valueAlreadyLiveAtInst(Value *Val,Value *KnownLive1,
                                                     Value *KnownLive2) {
    // If Val is either of the known-live values, we know it is live!
    if (Val == nullptr || Val == KnownLive1 || Val == KnownLive2)
@@ -3082,11 +3076,11 @@ bool AddressingModeMatcher::ValueAlreadyLiveAtInst(Value *Val,Value *KnownLive1,
    return Val->isUsedInBasicBlock(MemoryInst->getParent());
  }
  
-/// IsProfitableToFoldIntoAddressingMode - It is possible for the addressing
-/// mode of the machine to fold the specified instruction into a load or store
-/// that ultimately uses it.  However, the specified instruction has multiple
-/// uses.  Given this, it may actually increase register pressure to fold it
-/// into the load.  For example, consider this code:
+/// It is possible for the addressing mode of the machine to fold the specified
+/// instruction into a load or store that ultimately uses it.
+/// However, the specified instruction has multiple uses.
+/// Given this, it may actually increase register pressure to fold it
+/// into the load. For example, consider this code:
  ///
  ///     X = ...
  ///     Y = X+1
@@ -3104,7 +3098,7 @@ bool AddressingModeMatcher::ValueAlreadyLiveAtInst(Value *Val,Value *KnownLive1,
  /// X was live across 'load Z' for other reasons, we actually *would* want to
  /// fold the addressing mode in the Z case.  This would make Y die earlier.
  bool AddressingModeMatcher::
-IsProfitableToFoldIntoAddressingMode(Instruction *I, ExtAddrMode &AMBefore,
+isProfitableToFoldIntoAddressingMode(Instruction *I, ExtAddrMode &AMBefore,
                                       ExtAddrMode &AMAfter) {
    if (IgnoreProfitability) return true;
  
@@ -3121,9 +3115,9 @@ IsProfitableToFoldIntoAddressingMode(Instruction *I, ExtAddrMode &AMBefore,
  
    // If the BaseReg or ScaledReg was referenced by the previous addrmode, their
    // lifetime wasn't extended by adding this instruction.
-  if (ValueAlreadyLiveAtInst(BaseReg, AMBefore.BaseReg, AMBefore.ScaledReg))
+  if (valueAlreadyLiveAtInst(BaseReg, AMBefore.BaseReg, AMBefore.ScaledReg))
      BaseReg = nullptr;
-  if (ValueAlreadyLiveAtInst(ScaledReg, AMBefore.BaseReg, AMBefore.ScaledReg))
+  if (valueAlreadyLiveAtInst(ScaledReg, AMBefore.BaseReg, AMBefore.ScaledReg))
      ScaledReg = nullptr;
  
    // If folding this instruction (and it's subexprs) didn't extend any live
@@ -3168,7 +3162,7 @@ IsProfitableToFoldIntoAddressingMode(Instruction *I, ExtAddrMode &AMBefore,
                                    MemoryInst, Result, InsertedInsts,
                                    PromotedInsts, TPT);
      Matcher.IgnoreProfitability = true;
-    bool Success = Matcher.MatchAddr(Address, 0);
+    bool Success = Matcher.matchAddr(Address, 0);
      (void)Success; assert(Success && "Couldn't select *anything*?");
  
      // The match was to check the profitability, the changes made are not
@@ -3189,7 +3183,7 @@ IsProfitableToFoldIntoAddressingMode(Instruction *I, ExtAddrMode &AMBefore,
  
  } // end anonymous namespace
  
-/// IsNonLocalValue - Return true if the specified values are defined in a
+/// Return true if the specified values are defined in a
  /// different basic block than BB.
  static bool IsNonLocalValue(Value *V, BasicBlock *BB) {
    if (Instruction *I = dyn_cast<Instruction>(V))
@@ -3197,16 +3191,15 @@ static bool IsNonLocalValue(Value *V, BasicBlock *BB) {
    return false;
  }
  
-/// OptimizeMemoryInst - Load and Store Instructions often have
-/// addressing modes that can do significant amounts of computation.  As such,
-/// instruction selection will try to get the load or store to do as much
-/// computation as possible for the program.  The problem is that isel can only
-/// see within a single block.  As such, we sink as much legal addressing mode
-/// stuff into the block as possible.
+/// Load and Store Instructions often have addressing modes that can do
+/// significant amounts of computation. As such, instruction selection will try
+/// to get the load or store to do as much computation as possible for the
+/// program. The problem is that isel can only see within a single block. As
+/// such, we sink as much legal addressing mode work into the block as possible.
  ///
  /// This method is used to optimize both load/store and inline asms with memory
  /// operands.
-bool CodeGenPrepare::OptimizeMemoryInst(Instruction *MemoryInst, Value *Addr,
+bool CodeGenPrepare::optimizeMemoryInst(Instruction *MemoryInst, Value *Addr,
                                          Type *AccessTy, unsigned AddrSpace) {
    Value *Repl = Addr;
  
@@ -3543,10 +3536,9 @@ bool CodeGenPrepare::OptimizeMemoryInst(Instruction *MemoryInst, Value *Addr,
    return true;
  }
  
-/// OptimizeInlineAsmInst - If there are any memory operands, use
-/// OptimizeMemoryInst to sink their address computing into the block when
-/// possible / profitable.
-bool CodeGenPrepare::OptimizeInlineAsmInst(CallInst *CS) {
+/// If there are any memory operands, use OptimizeMemoryInst to sink their
+/// address computing into the block when possible / profitable.
+bool CodeGenPrepare::optimizeInlineAsmInst(CallInst *CS) {
    bool MadeChange = false;
  
    const TargetRegisterInfo *TRI =
@@ -3563,7 +3555,7 @@ bool CodeGenPrepare::OptimizeInlineAsmInst(CallInst *CS) {
      if (OpInfo.ConstraintType == TargetLowering::C_Memory &&
          OpInfo.isIndirect) {
        Value *OpVal = CS->getArgOperand(ArgNo++);
-      MadeChange |= OptimizeMemoryInst(CS, OpVal, OpVal->getType(), ~0u);
+      MadeChange |= optimizeMemoryInst(CS, OpVal, OpVal->getType(), ~0u);
      } else if (OpInfo.Type == InlineAsm::isInput)
        ArgNo++;
    }
@@ -3643,7 +3635,7 @@ static bool hasSameExtUse(Instruction *Inst, const TargetLowering &TLI) {
  /// %add = add nuw i64 %zext, 4
  /// \encode
  /// Thanks to the promotion, we can match zext(load i32*) to i64.
-bool CodeGenPrepare::ExtLdPromotion(TypePromotionTransaction &TPT,
+bool CodeGenPrepare::extLdPromotion(TypePromotionTransaction &TPT,
                                      LoadInst *&LI, Instruction *&Inst,
                                      const SmallVectorImpl<Instruction *> &Exts,
                                      unsigned CreatedInstsCost = 0) {
@@ -3693,7 +3685,7 @@ bool CodeGenPrepare::ExtLdPromotion(TypePromotionTransaction &TPT,
      }
      // The promotion is profitable.
      // Check if it exposes an ext(load).
-    (void)ExtLdPromotion(TPT, LI, Inst, NewExts, TotalCreatedInstsCost);
+    (void)extLdPromotion(TPT, LI, Inst, NewExts, TotalCreatedInstsCost);
      if (LI && (StressExtLdPromotion || NewCreatedInstsCost <= ExtCost ||
                 // If we have created a new extension, i.e., now we have two
                 // extensions. We must make sure one of them is merged with
@@ -3710,13 +3702,13 @@ bool CodeGenPrepare::ExtLdPromotion(TypePromotionTransaction &TPT,
    return false;
  }
  
-/// MoveExtToFormExtLoad - Move a zext or sext fed by a load into the same
-/// basic block as the load, unless conditions are unfavorable. This allows
-/// SelectionDAG to fold the extend into the load.
+/// Move a zext or sext fed by a load into the same basic block as the load,
+/// unless conditions are unfavorable. This allows SelectionDAG to fold the
+/// extend into the load.
  /// \p I[in/out] the extension may be modified during the process if some
  /// promotions apply.
  ///
-bool CodeGenPrepare::MoveExtToFormExtLoad(Instruction *&I) {
+bool CodeGenPrepare::moveExtToFormExtLoad(Instruction *&I) {
    // Try to promote a chain of computation if it allows to form
    // an extended load.
    TypePromotionTransaction TPT;
@@ -3727,7 +3719,7 @@ bool CodeGenPrepare::MoveExtToFormExtLoad(Instruction *&I) {
    // Look for a load being extended.
    LoadInst *LI = nullptr;
    Instruction *OldExt = I;
-  bool HasPromoted = ExtLdPromotion(TPT, LI, I, Exts);
+  bool HasPromoted = extLdPromotion(TPT, LI, I, Exts);
    if (!LI || !I) {
      assert(!HasPromoted && !LI && "If we did not match any load instruction "
                                    "the code must remain the same");
@@ -3777,7 +3769,7 @@ bool CodeGenPrepare::MoveExtToFormExtLoad(Instruction *&I) {
    return true;
  }
  
-bool CodeGenPrepare::OptimizeExtUses(Instruction *I) {
+bool CodeGenPrepare::optimizeExtUses(Instruction *I) {
    BasicBlock *DefBB = I->getParent();
  
    // If the result of a {s|z}ext and its source are both live out, rewrite all
@@ -3848,8 +3840,7 @@ bool CodeGenPrepare::OptimizeExtUses(Instruction *I) {
    return MadeChange;
  }
  
-/// isFormingBranchFromSelectProfitable - Returns true if a SelectInst should be
-/// turned into an explicit branch.
+/// Returns true if a SelectInst should be turned into an explicit branch.
  static bool isFormingBranchFromSelectProfitable(SelectInst *SI) {
    // FIXME: This should use the same heuristics as IfConversion to determine
    // whether a select is better represented as a branch.  This requires that
@@ -3858,28 +3849,27 @@ static bool isFormingBranchFromSelectProfitable(SelectInst *SI) {
  
    CmpInst *Cmp = dyn_cast<CmpInst>(SI->getCondition());
  
-  // If the branch is predicted right, an out of order CPU can avoid blocking on
-  // the compare.  Emit cmovs on compares with a memory operand as branches to
-  // avoid stalls on the load from memory.  If the compare has more than one use
-  // there's probably another cmov or setcc around so it's not worth emitting a
-  // branch.
-  if (!Cmp)
+  // If a branch is predictable, an out-of-order CPU can avoid blocking on its
+  // comparison condition. If the compare has more than one use, there's
+  // probably another cmov or setcc around, so it's not worth emitting a branch.
+  if (!Cmp || !Cmp->hasOneUse())
      return false;
  
    Value *CmpOp0 = Cmp->getOperand(0);
    Value *CmpOp1 = Cmp->getOperand(1);
  
-  // We check that the memory operand has one use to avoid uses of the loaded
-  // value directly after the compare, making branches unprofitable.
-  return Cmp->hasOneUse() &&
-         ((isa<LoadInst>(CmpOp0) && CmpOp0->hasOneUse()) ||
+  // Emit "cmov on compare with a memory operand" as a branch to avoid stalls
+  // on a load from memory. But if the load is used more than once, do not
+  // change the select to a branch because the load is probably needed
+  // regardless of whether the branch is taken or not.
+  return ((isa<LoadInst>(CmpOp0) && CmpOp0->hasOneUse()) ||
            (isa<LoadInst>(CmpOp1) && CmpOp1->hasOneUse()));
  }
  
  
  /// If we have a SelectInst that will likely profit from branch prediction,
  /// turn it into a branch.
-bool CodeGenPrepare::OptimizeSelectInst(SelectInst *SI) {
+bool CodeGenPrepare::optimizeSelectInst(SelectInst *SI) {
    bool VectorCond = !SI->getCondition()->getType()->isIntegerTy(1);
  
    // Can we convert the 'select' to CF ?
@@ -3952,7 +3942,7 @@ static bool isBroadcastShuffle(ShuffleVectorInst *SVI) {
  /// (e.g. x86 only introduced "vpsllvd" and friends with AVX2). In these cases
  /// it's often worth sinking a shufflevector splat down to its use so that
  /// codegen can spot all lanes are identical.
-bool CodeGenPrepare::OptimizeShuffleVectorInst(ShuffleVectorInst *SVI) {
+bool CodeGenPrepare::optimizeShuffleVectorInst(ShuffleVectorInst *SVI) {
    BasicBlock *DefBB = SVI->getParent();
  
    // Only do this xform if variable vector shifts are particularly expensive.
@@ -4135,7 +4125,7 @@ class VectorPromoteHelper {
    /// \brief Generate a constant vector with \p Val with the same
    /// number of elements as the transition.
    /// \p UseSplat defines whether or not \p Val should be replicated
-  /// accross the whole vector.
+  /// across the whole vector.
    /// In other words, if UseSplat == true, we generate <Val, Val, ..., Val>,
    /// otherwise we generate a vector with as many undef as possible:
    /// <undef, ..., undef, Val, undef, ..., undef> where \p Val is only
@@ -4317,7 +4307,7 @@ void VectorPromoteHelper::promoteImpl(Instruction *ToBePromoted) {
  /// Some targets can do store(extractelement) with one instruction.
  /// Try to push the extractelement towards the stores when the target
  /// has this feature and this is profitable.
-bool CodeGenPrepare::OptimizeExtractElementInst(Instruction *Inst) {
+bool CodeGenPrepare::optimizeExtractElementInst(Instruction *Inst) {
    unsigned CombineCost = UINT_MAX;
    if (DisableStoreExtract || !TLI ||
        (!StressStoreExtract &&
@@ -4369,7 +4359,7 @@ bool CodeGenPrepare::OptimizeExtractElementInst(Instruction *Inst) {
    return false;
  }
  
-bool CodeGenPrepare::OptimizeInst(Instruction *I, bool& ModifiedDT) {
+bool CodeGenPrepare::optimizeInst(Instruction *I, bool& ModifiedDT) {
    // Bail out if we inserted the instruction to prevent optimizations from
    // stepping on each other's toes.
    if (InsertedInsts.count(I))
@@ -4410,8 +4400,8 @@ bool CodeGenPrepare::OptimizeInst(Instruction *I, bool& ModifiedDT) {
                TargetLowering::TypeExpandInteger) {
          return SinkCast(CI);
        } else {
-        bool MadeChange = MoveExtToFormExtLoad(I);
-        return MadeChange | OptimizeExtUses(I);
+        bool MadeChange = moveExtToFormExtLoad(I);
+        return MadeChange | optimizeExtUses(I);
        }
      }
      return false;
@@ -4422,17 +4412,19 @@ bool CodeGenPrepare::OptimizeInst(Instruction *I, bool& ModifiedDT) {
        return OptimizeCmpExpression(CI);
  
    if (LoadInst *LI = dyn_cast<LoadInst>(I)) {
+    stripInvariantGroupMetadata(*LI);
      if (TLI) {
        unsigned AS = LI->getPointerAddressSpace();
-      return OptimizeMemoryInst(I, I->getOperand(0), LI->getType(), AS);
+      return optimizeMemoryInst(I, I->getOperand(0), LI->getType(), AS);
      }
      return false;
    }
  
    if (StoreInst *SI = dyn_cast<StoreInst>(I)) {
+    stripInvariantGroupMetadata(*SI);
      if (TLI) {
        unsigned AS = SI->getPointerAddressSpace();
-      return OptimizeMemoryInst(I, SI->getOperand(1),
+      return optimizeMemoryInst(I, SI->getOperand(1),
                                  SI->getOperand(0)->getType(), AS);
      }
      return false;
@@ -4457,23 +4449,23 @@ bool CodeGenPrepare::OptimizeInst(Instruction *I, bool& ModifiedDT) {
        GEPI->replaceAllUsesWith(NC);
        GEPI->eraseFromParent();
        ++NumGEPsElim;
-      OptimizeInst(NC, ModifiedDT);
+      optimizeInst(NC, ModifiedDT);
        return true;
      }
      return false;
    }
  
    if (CallInst *CI = dyn_cast<CallInst>(I))
-    return OptimizeCallInst(CI, ModifiedDT);
+    return optimizeCallInst(CI, ModifiedDT);
  
    if (SelectInst *SI = dyn_cast<SelectInst>(I))
-    return OptimizeSelectInst(SI);
+    return optimizeSelectInst(SI);
  
    if (ShuffleVectorInst *SVI = dyn_cast<ShuffleVectorInst>(I))
-    return OptimizeShuffleVectorInst(SVI);
+    return optimizeShuffleVectorInst(SVI);
  
    if (isa<ExtractElementInst>(I))
-    return OptimizeExtractElementInst(I);
+    return optimizeExtractElementInst(I);
  
    return false;
  }
@@ -4481,17 +4473,17 @@ bool CodeGenPrepare::OptimizeInst(Instruction *I, bool& ModifiedDT) {
  // In this pass we look for GEP and cast instructions that are used
  // across basic blocks and rewrite them to improve basic-block-at-a-time
  // selection.
-bool CodeGenPrepare::OptimizeBlock(BasicBlock &BB, bool& ModifiedDT) {
+bool CodeGenPrepare::optimizeBlock(BasicBlock &BB, bool& ModifiedDT) {
    SunkAddrs.clear();
    bool MadeChange = false;
  
    CurInstIterator = BB.begin();
    while (CurInstIterator != BB.end()) {
-    MadeChange |= OptimizeInst(CurInstIterator++, ModifiedDT);
+    MadeChange |= optimizeInst(CurInstIterator++, ModifiedDT);
      if (ModifiedDT)
        return true;
    }
-  MadeChange |= DupRetToEnableTailCallOpts(&BB);
+  MadeChange |= dupRetToEnableTailCallOpts(&BB);
  
    return MadeChange;
  }
@@ -4499,7 +4491,7 @@ bool CodeGenPrepare::OptimizeBlock(BasicBlock &BB, bool& ModifiedDT) {
  // llvm.dbg.value is far away from the value then iSel may not be able
  // handle it properly. iSel will drop llvm.dbg.value if it can not
  // find a node corresponding to the value.
-bool CodeGenPrepare::PlaceDbgValues(Function &F) {
+bool CodeGenPrepare::placeDbgValues(Function &F) {
    bool MadeChange = false;
    for (BasicBlock &BB : F) {
      Instruction *PrevNonDbgInst = nullptr;
@@ -4668,6 +4660,10 @@ bool CodeGenPrepare::splitBranchCondition(Function &F) {
      if (!match(BB.getTerminator(), m_Br(m_OneUse(m_BinOp(LogicOp)), TBB, FBB)))
        continue;
  
+    auto *Br1 = cast<BranchInst>(BB.getTerminator());
+    if (Br1->getMetadata(LLVMContext::MD_unpredictable))
+      continue;
+
      unsigned Opc;
      Value *Cond1, *Cond2;
      if (match(LogicOp, m_And(m_OneUse(m_Value(Cond1)),
@@ -4694,7 +4690,6 @@ bool CodeGenPrepare::splitBranchCondition(Function &F) {
  
      // Update original basic block by using the first condition directly by the
      // branch instruction and removing the no longer needed and/or instruction.
-    auto *Br1 = cast<BranchInst>(BB.getTerminator());
      Br1->setCondition(Cond1);
      LogicOp->eraseFromParent();
  
@@ -4825,3 +4820,8 @@ bool CodeGenPrepare::splitBranchCondition(Function &F) {
    }
    return MadeChange;
  }
+
+void CodeGenPrepare::stripInvariantGroupMetadata(Instruction &I) {
+  if (auto *InvariantMD = I.getMetadata(LLVMContext::MD_invariant_group))
+    I.dropUnknownNonDebugMetadata(InvariantMD->getMetadataID());
+}