R600/SI: Rename encoding field to match docs for VOP3b

[oota-llvm.git] / lib / Target / R600 / AMDGPUISelLowering.h
diff --git a/lib/Target/R600/AMDGPUISelLowering.h b/lib/Target/R600/AMDGPUISelLowering.h

index 5001116f5a06d1721cd88472de9a5b10bcc6e2f3..caf96539430a60892e9517b2ebd8f7568d309260 100644 (file)
--- a/lib/Target/R600/AMDGPUISelLowering.h
+++ b/lib/Target/R600/AMDGPUISelLowering.h
@@ -43,18 +43,25 @@ private:
    /// \brief Split a vector store into multiple scalar stores.
    /// \returns The resulting chain.
  
-  SDValue LowerUDIVREM(SDValue Op, SelectionDAG &DAG) const;
+  SDValue LowerFREM(SDValue Op, SelectionDAG &DAG) const;
    SDValue LowerFCEIL(SDValue Op, SelectionDAG &DAG) const;
    SDValue LowerFTRUNC(SDValue Op, SelectionDAG &DAG) const;
    SDValue LowerFRINT(SDValue Op, SelectionDAG &DAG) const;
    SDValue LowerFNEARBYINT(SDValue Op, SelectionDAG &DAG) const;
+
+  SDValue LowerFROUND32(SDValue Op, SelectionDAG &DAG) const;
+  SDValue LowerFROUND64(SDValue Op, SelectionDAG &DAG) const;
+  SDValue LowerFROUND(SDValue Op, SelectionDAG &DAG) const;
    SDValue LowerFFLOOR(SDValue Op, SelectionDAG &DAG) const;
  
+  SDValue LowerINT_TO_FP64(SDValue Op, SelectionDAG &DAG, bool Signed) const;
    SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
+  SDValue LowerSINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
+
+  SDValue LowerFP64_TO_INT(SDValue Op, SelectionDAG &DAG, bool Signed) const;
+  SDValue LowerFP_TO_UINT(SDValue Op, SelectionDAG &DAG) const;
+  SDValue LowerFP_TO_SINT(SDValue Op, SelectionDAG &DAG) const;
  
-  SDValue ExpandSIGN_EXTEND_INREG(SDValue Op,
-                                  unsigned BitsDiff,
-                                  SelectionDAG &DAG) const;
    SDValue LowerSIGN_EXTEND_INREG(SDValue Op, SelectionDAG &DAG) const;
  
    SDValue performStoreCombine(SDNode *N, DAGCombinerInfo &DCI) const;
@@ -82,7 +89,10 @@ protected:
    SDValue LowerLOAD(SDValue Op, SelectionDAG &DAG) const;
    SDValue LowerSTORE(SDValue Op, SelectionDAG &DAG) const;
    SDValue LowerSDIVREM(SDValue Op, SelectionDAG &DAG) const;
+  SDValue LowerUDIVREM(SDValue Op, SelectionDAG &DAG) const;
    SDValue LowerDIVREM24(SDValue Op, SelectionDAG &DAG, bool sign) const;
+  void LowerUDIVREM64(SDValue Op, SelectionDAG &DAG,
+                                    SmallVectorImpl<SDValue> &Results) const;
    bool isHWTrueValue(SDValue Op) const;
    bool isHWFalseValue(SDValue Op) const;
  
@@ -100,7 +110,7 @@ protected:
                                const SmallVectorImpl<ISD::InputArg> &Ins) const;
  
  public:
-  AMDGPUTargetLowering(TargetMachine &TM);
+  AMDGPUTargetLowering(TargetMachine &TM, const AMDGPUSubtarget &STI);
  
    bool isFAbsFree(EVT VT) const override;
    bool isFNegFree(EVT VT) const override;
@@ -118,8 +128,14 @@ public:
  
    bool isFPImmLegal(const APFloat &Imm, EVT VT) const override;
    bool ShouldShrinkFPConstant(EVT VT) const override;
+  bool shouldReduceLoadWidth(SDNode *Load,
+                             ISD::LoadExtType ExtType,
+                             EVT ExtVT) const override;
  
    bool isLoadBitCastBeneficial(EVT, EVT) const override;
+  bool isCheapToSpeculateCttz() const override;
+  bool isCheapToSpeculateCtlz() const override;
+
    SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv,
                        bool isVarArg,
                        const SmallVectorImpl<ISD::OutputArg> &Outs,
@@ -136,9 +152,33 @@ public:
  
    SDValue LowerIntrinsicIABS(SDValue Op, SelectionDAG &DAG) const;
    SDValue LowerIntrinsicLRP(SDValue Op, SelectionDAG &DAG) const;
-  SDValue CombineMinMax(SDNode *N, SelectionDAG &DAG) const;
+  SDValue CombineFMinMaxLegacy(SDLoc DL,
+                               EVT VT,
+                               SDValue LHS,
+                               SDValue RHS,
+                               SDValue True,
+                               SDValue False,
+                               SDValue CC,
+                               DAGCombinerInfo &DCI) const;
+  SDValue CombineIMinMax(SDLoc DL,
+                         EVT VT,
+                         SDValue LHS,
+                         SDValue RHS,
+                         SDValue True,
+                         SDValue False,
+                         SDValue CC,
+                         SelectionDAG &DAG) const;
+
    const char* getTargetNodeName(unsigned Opcode) const override;
  
+  SDValue getRsqrtEstimate(SDValue Operand,
+                           DAGCombinerInfo &DCI,
+                           unsigned &RefinementSteps,
+                           bool &UseOneConstNR) const override;
+  SDValue getRecipEstimate(SDValue Operand,
+                           DAGCombinerInfo &DCI,
+                           unsigned &RefinementSteps) const override;
+
    virtual SDNode *PostISelFolding(MachineSDNode *N,
                                    SelectionDAG &DAG) const {
      return N;
@@ -153,10 +193,8 @@ public:
                                       const SelectionDAG &DAG,
                                       unsigned Depth = 0) const override;
  
-  virtual unsigned ComputeNumSignBitsForTargetNode(
-    SDValue Op,
-    const SelectionDAG &DAG,
-    unsigned Depth = 0) const override;
+  unsigned ComputeNumSignBitsForTargetNode(SDValue Op, const SelectionDAG &DAG,
+                                           unsigned Depth = 0) const override;
  
    /// \brief Helper function that adds Reg to the LiveIn list of the DAG's
    /// MachineFunction.
@@ -180,17 +218,24 @@ enum {
    DWORDADDR,
    FRACT,
    CLAMP,
+  MAD, // Multiply + add with same result as the separate operations.
  
    // SIN_HW, COS_HW - f32 for SI, 1 ULP max error, valid from -100 pi to 100 pi.
    // Denormals handled on some parts.
    COS_HW,
    SIN_HW,
-  FMAX,
+  FMAX_LEGACY,
    SMAX,
    UMAX,
-  FMIN,
+  FMIN_LEGACY,
    SMIN,
    UMIN,
+  FMAX3,
+  SMAX3,
+  UMAX3,
+  FMIN3,
+  SMIN3,
+  UMIN3,
    URECIP,
    DIV_SCALE,
    DIV_FMAS,
@@ -203,6 +248,8 @@ enum {
    RSQ,
    RSQ_LEGACY,
    RSQ_CLAMPED,
+  LDEXP,
+  FP_CLASS,
    DOT4,
    BFE_U32, // Extract range of bits with zero extension to 32-bits.
    BFE_I32, // Extract range of bits with sign extension to 32-bits.