AMDGPU/SI: Use flat for global load/store when targeting HSA

[oota-llvm.git] / lib / Target / AMDGPU / AMDGPU.td
diff --git a/lib/Target/AMDGPU/AMDGPU.td b/lib/Target/AMDGPU/AMDGPU.td

index 569ad3844b2533193ad5a24c485785a9946f56e3..5913bf7f773f4e497573ba90ad88c96275daa180 100644 (file)
--- a/lib/Target/AMDGPU/AMDGPU.td
+++ b/lib/Target/AMDGPU/AMDGPU.td
@@ -98,6 +98,21 @@ def FeatureEnableLoadStoreOpt : SubtargetFeature <"load-store-opt",
          "true",
          "Enable SI load/store optimizer pass">;
  
+// Performance debugging feature. Allow using DS instruction immediate
+// offsets even if the base pointer can't be proven to be safe. On SI,
+// base pointer values that won't give the same result as a 16-bit add
+// are not safe to fold, but this will override the conservative test
+// for the base pointer.
+def FeatureEnableUnsafeDSOffsetFolding : SubtargetFeature <"unsafe-ds-offset-folding",
+        "EnableUnsafeDSOffsetFolding",
+        "true",
+        "Force using DS instruction immediate offsets on SI">;
+
+def FeatureFlatForGlobal : SubtargetFeature<"flat-for-global",  // feature name string
+        "FlatForGlobal",  // NOTE(review): presumably the subtarget member assigned the value below - confirm
+        "true",
+        "Force to generate flat instruction for global">;  // description string
+
  def FeatureFlatAddressSpace : SubtargetFeature<"flat-address-space",
          "FlatAddressSpace",
          "true",
@@ -113,6 +128,11 @@ def FeatureSGPRInitBug : SubtargetFeature<"sgpr-init-bug",
          "true",
          "VI SGPR initilization bug requiring a fixed SGPR allocation size">;
  
+def FeatureEnableHugeScratchBuffer : SubtargetFeature<"huge-scratch-buffer",  // feature name string
+        "EnableHugeScratchBuffer",  // NOTE(review): presumably the subtarget member assigned the value below - confirm
+        "true",
+        "Enable scratch buffer sizes greater than 128 GB">;  // description string
+
  class SubtargetFeatureFetchLimit <string Value> :
                            SubtargetFeature <"fetch"#Value,
          "TexVTXClauseSize",