[x86] enable machine combiner reassociations for scalar single-precision minimums

[oota-llvm.git] / lib / Target / X86 / X86InstrInfo.cpp
diff --git a/lib/Target/X86/X86InstrInfo.cpp b/lib/Target/X86/X86InstrInfo.cpp

index efa972ad9a9c77fcf707258d4854de514e18ff43..bd3a3e5165da4349f27b281f6999da2edaebbc4a 100644 (file)
--- a/lib/Target/X86/X86InstrInfo.cpp
+++ b/lib/Target/X86/X86InstrInfo.cpp
@@ -2456,7 +2456,7 @@ inline static unsigned getTruncatedShiftCount(MachineInstr *MI,
  inline static bool isTruncatedShiftCountForLEA(unsigned ShAmt) {
    // Left shift instructions can be transformed into load-effective-address
    // instructions if we can encode them appropriately.
-  // A LEA instruction utilizes a SIB byte to encode it's scale factor.
+  // A LEA instruction utilizes a SIB byte to encode its scale factor.
    // The SIB.scale field is two bits wide which means that we can encode any
    // shift amount less than 4.
    return ShAmt < 4 && ShAmt > 0;
@@ -4763,8 +4763,8 @@ static void expandLoadStackGuard(MachineInstrBuilder &MIB,
    const GlobalValue *GV =
        cast<GlobalValue>((*MIB->memoperands_begin())->getValue());
    unsigned Flag = MachineMemOperand::MOLoad | MachineMemOperand::MOInvariant;
-  MachineMemOperand *MMO = MBB.getParent()->
-      getMachineMemOperand(MachinePointerInfo::getGOT(), Flag, 8, 8);
+  MachineMemOperand *MMO = MBB.getParent()->getMachineMemOperand(
+      MachinePointerInfo::getGOT(*MBB.getParent()), Flag, 8, 8);
    MachineBasicBlock::iterator I = MIB.getInstr();
  
    BuildMI(MBB, I, DL, TII.get(X86::MOV64rm), Reg).addReg(X86::RIP).addImm(1)
@@ -6385,11 +6385,17 @@ static bool hasReassociableSibling(const MachineInstr &Inst, bool &Commuted) {
  // TODO: There are many more machine instruction opcodes to match:
  //       1. Other data types (integer, vectors)
  //       2. Other math / logic operations (and, or)
+//       3. Other forms of the same operation (intrinsics and other variants)
  static bool isAssociativeAndCommutative(const MachineInstr &Inst) {
    switch (Inst.getOpcode()) {
    case X86::IMUL16rr:
    case X86::IMUL32rr:
    case X86::IMUL64rr:
+  // Normal min/max instructions are not commutative because of NaN and signed
+  // zero semantics, but these 'C' variants are. Thus, there's no need to check
+  // for global relaxed math; the instructions have the properties we need.
+  case X86::MINCSSrr:
+  case X86::VMINCSSrr:
      return true;
    case X86::ADDPDrr:
    case X86::ADDPSrr:
@@ -6401,10 +6407,14 @@ static bool isAssociativeAndCommutative(const MachineInstr &Inst) {
    case X86::MULSSrr:
    case X86::VADDPDrr:
    case X86::VADDPSrr:
+  case X86::VADDPDYrr:
+  case X86::VADDPSYrr:
    case X86::VADDSDrr:
    case X86::VADDSSrr:
    case X86::VMULPDrr:
    case X86::VMULPSrr:
+  case X86::VMULPDYrr:
+  case X86::VMULPSYrr:
    case X86::VMULSDrr:
    case X86::VMULSSrr:
      return Inst.getParent()->getParent()->getTarget().Options.UnsafeFPMath;