X86: Remove pre-2010 dead code in mergeSPUpdatesDown

[oota-llvm.git] / lib / Target / X86 / X86ISelLowering.h
diff --git a/lib/Target/X86/X86ISelLowering.h b/lib/Target/X86/X86ISelLowering.h

index f63b821ce6a592fe6b7e2cc5c6e4577cad50e187..5d69c1fa188c1cdf0b7577c383a4978ab332a42c 100644 (file)
--- a/lib/Target/X86/X86ISelLowering.h
+++ b/lib/Target/X86/X86ISelLowering.h
@@ -158,6 +158,10 @@ namespace llvm {
        /// vector to a GPR.
        MMX_MOVD2W,
  
+      /// MMX_MOVW2D - Copies a GPR into the low 32-bit word of a MMX vector
+      /// and zero out the high word.
+      MMX_MOVW2D,
+
        /// PEXTRB - Extract an 8-bit value from a vector and zero extend it to
        /// i32, corresponds to X86::PEXTRB.
        PEXTRB,
@@ -190,9 +194,19 @@ namespace llvm {
        /// BLENDI - Blend where the selector is an immediate.
        BLENDI,
  
+      /// SHRUNKBLEND - Blend where the condition has been shrunk.
+      /// This is used to emphasize that the condition mask is
+      /// no more valid for generic VSELECT optimizations.
+      SHRUNKBLEND,
+
        /// ADDSUB - Combined add and sub on an FP vector.
        ADDSUB,
-
+      //  FADD, FSUB, FMUL, FDIV, FMIN, FMAX - FP vector ops with rounding mode.
+      FADD_RND,
+      FSUB_RND,
+      FMUL_RND,
+      FDIV_RND,
+      
        // SUBUS - Integer sub with unsigned saturation.
        SUBUS,
  
@@ -301,6 +315,13 @@ namespace llvm {
  
        UMUL, // LOW, HI, FLAGS = umul LHS, RHS
  
+      // 8-bit SMUL/UMUL - AX, FLAGS = smul8/umul8 AL, RHS
+      SMUL8, UMUL8,
+
+      // 8-bit divrem that zero-extend the high result (AH).
+      UDIVREM8_ZEXT_HREG,
+      SDIVREM8_SEXT_HREG,
+
        // MUL_IMM - X86 specific multiply by immediate.
        MUL_IMM,
  
@@ -366,6 +387,17 @@ namespace llvm {
        FNMSUB,
        FMADDSUB,
        FMSUBADD,
+      // FMA with rounding mode
+      FMADD_RND,
+      FNMADD_RND,
+      FMSUB_RND,
+      FNMSUB_RND,
+      FMADDSUB_RND,
+      FMSUBADD_RND,     
+
+      // Compress and expand
+      COMPRESS,
+      EXPAND,
  
        // Save xmm argument registers to the stack, according to %al. An operator
        // is needed so that this can be expanded with control flow.
@@ -407,6 +439,9 @@ namespace llvm {
        // Test if in transactional execution.
        XTEST,
  
+      // ERI instructions
+      RSQRT28, RCP28, EXP2,
+
        // Compare and swap.
        LCMPXCHG_DAG = ISD::FIRST_TARGET_MEMORY_OPCODE,
        LCMPXCHG8_DAG,
@@ -528,7 +563,8 @@ namespace llvm {
    //  X86 Implementation of the TargetLowering interface
    class X86TargetLowering final : public TargetLowering {
    public:
-    explicit X86TargetLowering(const X86TargetMachine &TM);
+    explicit X86TargetLowering(const X86TargetMachine &TM,
+                               const X86Subtarget &STI);
  
      unsigned getJumpTableEncoding() const override;
  
@@ -614,6 +650,10 @@ namespace llvm {
      /// This method returns the name of a target specific DAG node.
      const char *getTargetNodeName(unsigned Opcode) const override;
  
+    bool isCheapToSpeculateCttz() const override;
+
+    bool isCheapToSpeculateCtlz() const override;
+
      /// Return the value type to use for ISD::SETCC.
      EVT getSetCCResultType(LLVMContext &Context, EVT VT) const override;
  
@@ -709,6 +749,10 @@ namespace llvm {
      bool isZExtFree(EVT VT1, EVT VT2) const override;
      bool isZExtFree(SDValue Val, EVT VT2) const override;
  
+    /// Return true if folding a vector load into ExtVal (a sign, zero, or any
+    /// extend node) is profitable.
+    bool isVectorLoadExtDesirable(SDValue) const override;
+
      /// Return true if an FMA operation is faster than a pair of fmul and fadd
      /// instructions. fmuladd intrinsics will be expanded to FMAs when this
      /// method returns true, otherwise fmuladd is expanded to fmul + fadd.
@@ -747,9 +791,10 @@ namespace llvm {
        return !X86ScalarSSEf64 || VT == MVT::f80;
      }
  
-    const X86Subtarget* getSubtarget() const {
-      return Subtarget;
-    }
+    /// Return true if we believe it is correct and profitable to reduce the
+    /// load node to a smaller type.
+    bool shouldReduceLoadWidth(SDNode *Load, ISD::LoadExtType ExtTy,
+                               EVT NewVT) const override;
  
      /// Return true if the specified scalar FP type is computed in an SSE
      /// register, not on the X87 floating point stack.
@@ -772,6 +817,10 @@ namespace llvm {
      bool shouldConvertConstantLoadToIntImm(const APInt &Imm,
                                             Type *Ty) const override;
  
+    /// Return true if EXTRACT_SUBVECTOR is cheap for this result type
+    /// with this index.
+    bool isExtractSubvectorCheap(EVT ResVT, unsigned Index) const override;
+
      /// Intel processors have a unified instruction and data cache
      const char * getClearCacheBuiltinName() const override {
        return nullptr; // nothing to do, move along.
@@ -795,9 +844,6 @@ namespace llvm {
  
      bool isNoopAddrSpaceCast(unsigned SrcAS, unsigned DestAS) const override;
  
-    /// \brief Reset the operation actions based on target options.
-    void resetOperationActions() override;
-
      bool useLoadStackGuardNode() const override;
      /// \brief Customize the preferred legalization strategy for certain types.
      LegalizeTypeAction getPreferredVectorAction(EVT VT) const override;
@@ -812,10 +858,6 @@ namespace llvm {
      const X86Subtarget *Subtarget;
      const DataLayout *TD;
  
-    /// Used to store the TargetOptions so that we don't waste time resetting
-    /// the operation actions unless we have to.
-    TargetOptions TO;
-
      /// Select between SSE or x87 floating point ops.
      /// When SSE is available, use it for f32 operations.
      /// When SSE2 is available, use it for f64 operations.
@@ -1014,6 +1056,15 @@ namespace llvm {
  
      /// Convert a comparison if required by the subtarget.
      SDValue ConvertCmpIfNecessary(SDValue Cmp, SelectionDAG &DAG) const;
+
+    /// Use rsqrt* to speed up sqrt calculations.
+    SDValue getRsqrtEstimate(SDValue Operand, DAGCombinerInfo &DCI,
+                             unsigned &RefinementSteps,
+                             bool &UseOneConstNR) const override;
+
+    /// Use rcp* to speed up fdiv calculations.
+    SDValue getRecipEstimate(SDValue Operand, DAGCombinerInfo &DCI,
+                             unsigned &RefinementSteps) const override;
    };
  
    namespace X86 {