[AVX-512] Remove another extra space from the Intel syntax asm strings.

[oota-llvm.git] / lib / Target / X86 / X86Subtarget.h
diff --git a/lib/Target/X86/X86Subtarget.h b/lib/Target/X86/X86Subtarget.h

index 71bdd53f1d068c1ec5c70a689b8caa84638c496f..13d1026dcaa0b0f32cbba94b7b1ab0d669f6527d 100644 (file)
--- a/lib/Target/X86/X86Subtarget.h
+++ b/lib/Target/X86/X86Subtarget.h
@@ -47,11 +47,11 @@ class X86Subtarget final : public X86GenSubtargetInfo {
  
  protected:
    enum X86SSEEnum {
-    NoMMXSSE, MMX, SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42, AVX, AVX2, AVX512F
+    NoSSE, SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42, AVX, AVX2, AVX512F
    };
  
    enum X863DNowEnum {
-    NoThreeDNow, ThreeDNow, ThreeDNowA
+    NoThreeDNow, MMX, ThreeDNow, ThreeDNowA
    };
  
    enum X86ProcFamilyEnum {
@@ -64,10 +64,10 @@ protected:
    /// Which PIC style to use
    PICStyles::Style PICStyle;
  
-  /// MMX, SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42, or none supported.
+  /// SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42, or none supported.
    X86SSEEnum X86SSELevel;
  
-  /// 3DNow, 3DNow Athlon, or none supported.
+  /// MMX, 3DNow, 3DNow Athlon, or none supported.
    X863DNowEnum X863DNowLevel;
  
    /// True if this processor has conditional move instructions
@@ -86,6 +86,18 @@ protected:
    /// Target has AES instructions
    bool HasAES;
  
+  /// Target has FXSAVE/FXRESTOR instructions
+  bool HasFXSR;
+
+  /// Target has XSAVE instructions
+  bool HasXSAVE;
+  /// Target has XSAVEOPT instructions
+  bool HasXSAVEOPT;
+  /// Target has XSAVEC instructions
+  bool HasXSAVEC;
+  /// Target has XSAVES instructions
+  bool HasXSAVES;
+
    /// Target has carry-less multiplication
    bool HasPCLMUL;
  
@@ -134,17 +146,14 @@ protected:
    /// Processor has SHA instructions.
    bool HasSHA;
  
-  /// Processor has SGX instructions.
-  bool HasSGX;
-
    /// Processor has PRFCHW instructions.
    bool HasPRFCHW;
  
    /// Processor has RDSEED instructions.
    bool HasRDSEED;
  
-  /// Processor has SMAP instructions.
-  bool HasSMAP;
+  /// Processor has LAHF/SAHF instructions.
+  bool HasLAHFSAHF;
  
    /// True if BT (bit test) of memory instructions are slow.
    bool IsBTMemSlow;
@@ -152,10 +161,10 @@ protected:
    /// True if SHLD instructions are slow.
    bool IsSHLDSlow;
  
-  /// True if unaligned memory access is fast.
-  bool IsUAMemFast;
+  /// True if unaligned memory accesses of 16-bytes are slow.
+  bool IsUAMem16Slow;
  
-  /// True if unaligned 32-byte memory accesses are slow.
+  /// True if unaligned memory accesses of 32-bytes are slow.
    bool IsUAMem32Slow;
  
    /// True if SSE operations can have unaligned memory operands.
@@ -196,16 +205,6 @@ protected:
    /// True if INC and DEC instructions are slow when writing to flags
    bool SlowIncDec;
  
-  /// Use the RSQRT* instructions to optimize square root calculations.
-  /// For this to be profitable, the cost of FSQRT and FDIV must be
-  /// substantially higher than normal FP ops like FADD and FMUL.
-  bool UseSqrtEst;
-
-  /// Use the RCP* instructions to optimize FP division calculations.
-  /// For this to be profitable, the cost of FDIV must be
-  /// substantially higher than normal FP ops like FADD and FMUL.
-  bool UseReciprocalEst;
-
    /// Processor has AVX-512 PreFetch Instructions
    bool HasPFI;
  
@@ -224,6 +223,15 @@ protected:
    /// Processor has AVX-512 Vector Length eXtenstions
    bool HasVLX;
  
+  /// Processor has PKU extenstions
+  bool HasPKU;
+
+  /// Processot supports MPX - Memory Protection Extensions
+  bool HasMPX;
+
+  /// Use software floating point for code generation.
+  bool UseSoftFloat;
+
    /// The minimum alignment known to hold of the stack frame on
    /// entry to the function and which must be maintained by every function.
    unsigned stackAlignment;
@@ -263,9 +271,8 @@ public:
    /// This constructor initializes the data members to match that
    /// of the specified triple.
    ///
-  X86Subtarget(const std::string &TT, const std::string &CPU,
-               const std::string &FS, const X86TargetMachine &TM,
-               unsigned StackAlignOverride);
+  X86Subtarget(const Triple &TT, const std::string &CPU, const std::string &FS,
+               const X86TargetMachine &TM, unsigned StackAlignOverride);
  
    const X86TargetLowering *getTargetLowering() const override {
      return &TLInfo;
@@ -330,7 +337,6 @@ public:
    void setPICStyle(PICStyles::Style Style)  { PICStyle = Style; }
  
    bool hasCMov() const { return HasCMov; }
-  bool hasMMX() const { return X86SSELevel >= MMX; }
    bool hasSSE1() const { return X86SSELevel >= SSE1; }
    bool hasSSE2() const { return X86SSELevel >= SSE2; }
    bool hasSSE3() const { return X86SSELevel >= SSE3; }
@@ -343,14 +349,22 @@ public:
    bool hasFp256() const { return hasAVX(); }
    bool hasInt256() const { return hasAVX2(); }
    bool hasSSE4A() const { return HasSSE4A; }
+  bool hasMMX() const { return X863DNowLevel >= MMX; }
    bool has3DNow() const { return X863DNowLevel >= ThreeDNow; }
    bool has3DNowA() const { return X863DNowLevel >= ThreeDNowA; }
    bool hasPOPCNT() const { return HasPOPCNT; }
    bool hasAES() const { return HasAES; }
+  bool hasFXSR() const { return HasFXSR; }
+  bool hasXSAVE() const { return HasXSAVE; }
+  bool hasXSAVEOPT() const { return HasXSAVEOPT; }
+  bool hasXSAVEC() const { return HasXSAVEC; }
+  bool hasXSAVES() const { return HasXSAVES; }
    bool hasPCLMUL() const { return HasPCLMUL; }
-  bool hasFMA() const { return HasFMA; }
-  // FIXME: Favor FMA when both are enabled. Is this the right thing to do?
-  bool hasFMA4() const { return HasFMA4 && !HasFMA; }
+  // Prefer FMA4 to FMA - its better for commutation/memory folding and
+  // has equal or better performance on all supported targets.
+  bool hasFMA() const { return HasFMA && !HasFMA4; }
+  bool hasFMA4() const { return HasFMA4; }
+  bool hasAnyFMA() const { return hasFMA() || hasFMA4() || hasAVX512(); }
    bool hasXOP() const { return HasXOP; }
    bool hasTBM() const { return HasTBM; }
    bool hasMOVBE() const { return HasMOVBE; }
@@ -364,13 +378,12 @@ public:
    bool hasHLE() const { return HasHLE; }
    bool hasADX() const { return HasADX; }
    bool hasSHA() const { return HasSHA; }
-  bool hasSGX() const { return HasSGX; }
    bool hasPRFCHW() const { return HasPRFCHW; }
    bool hasRDSEED() const { return HasRDSEED; }
-  bool hasSMAP() const { return HasSMAP; }
+  bool hasLAHFSAHF() const { return HasLAHFSAHF; }
    bool isBTMemSlow() const { return IsBTMemSlow; }
    bool isSHLDSlow() const { return IsSHLDSlow; }
-  bool isUnalignedMemAccessFast() const { return IsUAMemFast; }
+  bool isUnalignedMem16Slow() const { return IsUAMem16Slow; }
    bool isUnalignedMem32Slow() const { return IsUAMem32Slow; }
    bool hasSSEUnalignedMem() const { return HasSSEUnalignedMem; }
    bool hasCmpxchg16b() const { return HasCmpxchg16b; }
@@ -382,17 +395,18 @@ public:
    bool LEAusesAG() const { return LEAUsesAG; }
    bool slowLEA() const { return SlowLEA; }
    bool slowIncDec() const { return SlowIncDec; }
-  bool useSqrtEst() const { return UseSqrtEst; }
-  bool useReciprocalEst() const { return UseReciprocalEst; }
    bool hasCDI() const { return HasCDI; }
    bool hasPFI() const { return HasPFI; }
    bool hasERI() const { return HasERI; }
    bool hasDQI() const { return HasDQI; }
    bool hasBWI() const { return HasBWI; }
    bool hasVLX() const { return HasVLX; }
+  bool hasPKU() const { return HasPKU; }
+  bool hasMPX() const { return HasMPX; }
  
    bool isAtom() const { return X86ProcFamily == IntelAtom; }
    bool isSLM() const { return X86ProcFamily == IntelSLM; }
+  bool useSoftFloat() const { return UseSoftFloat; }
  
    const Triple &getTargetTriple() const { return TargetTriple; }
  
@@ -407,9 +421,11 @@ public:
    bool isTargetMachO() const { return TargetTriple.isOSBinFormatMachO(); }
  
    bool isTargetLinux() const { return TargetTriple.isOSLinux(); }
+  bool isTargetAndroid() const { return TargetTriple.isAndroid(); }
    bool isTargetNaCl() const { return TargetTriple.isOSNaCl(); }
    bool isTargetNaCl32() const { return isTargetNaCl() && !is64Bit(); }
    bool isTargetNaCl64() const { return isTargetNaCl() && is64Bit(); }
+  bool isTargetMCU() const { return TargetTriple.isOSIAMCU(); }
  
    bool isTargetWindowsMSVC() const {
      return TargetTriple.isWindowsMSVCEnvironment();
@@ -419,6 +435,10 @@ public:
      return TargetTriple.isKnownWindowsMSVCEnvironment();
    }
  
+  bool isTargetWindowsCoreCLR() const {
+    return TargetTriple.isWindowsCoreCLREnvironment();
+  }
+
    bool isTargetWindowsCygwin() const {
      return TargetTriple.isWindowsCygwinEnvironment();
    }
@@ -460,8 +480,26 @@ public:
    }
  
    bool isCallingConvWin64(CallingConv::ID CC) const {
-    return (isTargetWin64() && CC != CallingConv::X86_64_SysV) ||
-           CC == CallingConv::X86_64_Win64;
+    switch (CC) {
+    // On Win64, all these conventions just use the default convention.
+    case CallingConv::C:
+    case CallingConv::Fast:
+    case CallingConv::X86_FastCall:
+    case CallingConv::X86_StdCall:
+    case CallingConv::X86_ThisCall:
+    case CallingConv::X86_VectorCall:
+    case CallingConv::Intel_OCL_BI:
+      return isTargetWin64();
+    // This convention allows using the Win64 convention on other targets.
+    case CallingConv::X86_64_Win64:
+      return true;
+    // This convention allows using the SysV convention on Windows targets.
+    case CallingConv::X86_64_SysV:
+      return false;
+    // Otherwise, who knows what this is.
+    default:
+      return false;
+    }
    }
  
    /// ClassifyGlobalReference - Classify a global variable reference for the