Revert r243250

[oota-llvm.git] / test / Analysis / CostModel / ARM / gep.ll
diff --git a/test/Analysis/CostModel/ARM/gep.ll b/test/Analysis/CostModel/ARM/gep.ll

index a70d6d42b61b6cdf9f57c42e57ee05324787171d..624ca113a3022bc7b1e7f7aa464c8f1b3f733edd 100644 (file)
--- a/test/Analysis/CostModel/ARM/gep.ll
+++ b/test/Analysis/CostModel/ARM/gep.ll
@@ -3,85 +3,41 @@
  target datalayout = "e-p:32:32:32-i1:8:32-i8:8:32-i16:16:32-i32:32:32-i64:32:64-f32:32:32-f64:32:64-v64:32:64-v128:32:128-a0:0:32-n32-S32"
  target triple = "thumbv7-apple-ios6.0.0"
  
-define void @test_geps(i32 %i) {
-  ; GEPs with index 0 are essentially NOOPs.
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds i8, i8*
+define void @test_geps() {
+  ; Cost of scalar integer geps should be one. We can't always expect it to be
+  ; folded into the instruction addressing mode.
+;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds i8, i8*
    %a0 = getelementptr inbounds i8, i8* undef, i32 0
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds i16, i16*
+;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds i16, i16*
    %a1 = getelementptr inbounds i16, i16* undef, i32 0
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds i32, i32*
+;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds i32, i32*
    %a2 = getelementptr inbounds i32, i32* undef, i32 0
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds i64, i64*
+
+;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds i64, i64*
    %a3 = getelementptr inbounds i64, i64* undef, i32 0
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds float, float*
+
+  ; Cost of scalar floating point geps should be one. We cannot fold the address
+  ; computation.
+;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds float, float*
    %a4 = getelementptr inbounds float, float* undef, i32 0
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds double, double*
+;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds double, double*
    %a5 = getelementptr inbounds double, double* undef, i32 0
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x i8>, <4 x i8>*
+
+
+  ; Cost of vector geps should be one. We cannot fold the address computation.
+;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds <4 x i8>, <4 x i8>*
    %a7 = getelementptr inbounds <4 x i8>, <4 x i8>* undef, i32 0
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x i16>, <4 x i16>*
+;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds <4 x i16>, <4 x i16>*
    %a8 = getelementptr inbounds <4 x i16>, <4 x i16>* undef, i32 0
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x i32>, <4 x i32>*
+;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds <4 x i32>, <4 x i32>*
    %a9 = getelementptr inbounds <4 x i32>, <4 x i32>* undef, i32 0
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x i64>, <4 x i64>*
+;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds <4 x i64>, <4 x i64>*
    %a10 = getelementptr inbounds <4 x i64>, <4 x i64>* undef, i32 0
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x float>, <4 x float>*
+;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds <4 x float>, <4 x float>*
    %a11 = getelementptr inbounds <4 x float>, <4 x float>* undef, i32 0
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x double>, <4 x double>*
+;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds <4 x double>, <4 x double>*
    %a12 = getelementptr inbounds <4 x double>, <4 x double>* undef, i32 0
  
-  ; Cost of GEPs is one if we cannot fold the address computation.
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds i8, i8*
-  %b0 = getelementptr inbounds i8, i8* undef, i32 1024
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds i16, i16*
-  %b1 = getelementptr inbounds i16, i16* undef, i32 1024
-  ; Thumb-2 cannot fold offset >= 2^12 into address computation.
-;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds i32, i32*
-  %b2 = getelementptr inbounds i32, i32* undef, i32 1024
-;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds i64, i64*
-  %b3 = getelementptr inbounds i64, i64* undef, i32 1024
-;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds float, float*
-  %b4 = getelementptr inbounds float, float* undef, i32 1024
-;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds double, double*
-  %b5 = getelementptr inbounds double, double* undef, i32 1024
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x i8>, <4 x i8>*
-  %b7 = getelementptr inbounds <4 x i8>, <4 x i8>* undef, i32 1
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x i16>, <4 x i16>*
-  %b8 = getelementptr inbounds <4 x i16>, <4 x i16>* undef, i32 1
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x i32>, <4 x i32>*
-  %b9 = getelementptr inbounds <4 x i32>, <4 x i32>* undef, i32 1
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x i64>, <4 x i64>*
-  %b10 = getelementptr inbounds <4 x i64>, <4 x i64>* undef, i32 1
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x float>, <4 x float>*
-  %b11 = getelementptr inbounds <4 x float>, <4 x float>* undef, i32 1
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x double>, <4 x double>*
-  %b12 = getelementptr inbounds <4 x double>, <4 x double>* undef, i32 1
-
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds i8, i8*
-  %c0 = getelementptr inbounds i8, i8* undef, i32 %i
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds i16, i16*
-  %c1 = getelementptr inbounds i16, i16* undef, i32 %i
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds i32, i32*
-  %c2 = getelementptr inbounds i32, i32* undef, i32 %i
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds i64, i64*
-  %c3 = getelementptr inbounds i64, i64* undef, i32 %i
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds float, float*
-  %c4 = getelementptr inbounds float, float* undef, i32 %i
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds double, double*
-  %c5 = getelementptr inbounds double, double* undef, i32 %i
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x i8>, <4 x i8>*
-  %c7 = getelementptr inbounds <4 x i8>, <4 x i8>* undef, i32 %i
-;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds <4 x i16>, <4 x i16>*
-  %c8 = getelementptr inbounds <4 x i16>, <4 x i16>* undef, i32 %i
-  ; Thumb-2 cannot fold scales larger than 8 to address computation.
-;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds <4 x i32>, <4 x i32>*
-  %c9 = getelementptr inbounds <4 x i32>, <4 x i32>* undef, i32 %i
-;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds <4 x i64>, <4 x i64>*
-  %c10 = getelementptr inbounds <4 x i64>, <4 x i64>* undef, i32 %i
-;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds <4 x float>, <4 x float>*
-  %c11 = getelementptr inbounds <4 x float>, <4 x float>* undef, i32 %i
-;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds <4 x double>, <4 x double>*
-  %c12 = getelementptr inbounds <4 x double>, <4 x double>* undef, i32 %i
  
    ret void
  }