Improve the X86 cost model for loads and stores.

[oota-llvm.git] / test / Analysis / CostModel / X86 / vectorized-loop.ll
diff --git a/test/Analysis/CostModel/X86/vectorized-loop.ll b/test/Analysis/CostModel/X86/vectorized-loop.ll
index 6c9e111bb10f7b1a336b900d2e394a12cd49febb..25b11145c661ed5b779101a0a30a27fe15771c02 100644
--- a/test/Analysis/CostModel/X86/vectorized-loop.ll
+++ b/test/Analysis/CostModel/X86/vectorized-loop.ll
@@ -28,16 +28,17 @@ vector.body:                                      ; preds = %for.body.lr.ph, %ve
    %4 = getelementptr inbounds i32* %B, i64 %3
    ;CHECK: cost of 0 {{.*}} bitcast
    %5 = bitcast i32* %4 to <8 x i32>*
-  ;CHECK: cost of 1 {{.*}} load
+  ;CHECK: cost of 2 {{.*}} load
    %6 = load <8 x i32>* %5, align 4
    ;CHECK: cost of 4 {{.*}} mul
    %7 = mul nsw <8 x i32> %6, <i32 5, i32 5, i32 5, i32 5, i32 5, i32 5, i32 5, i32 5>
    %8 = getelementptr inbounds i32* %A, i64 %index
    %9 = bitcast i32* %8 to <8 x i32>*
+  ;CHECK: cost of 2 {{.*}} load
    %10 = load <8 x i32>* %9, align 4
    ;CHECK: cost of 4 {{.*}} add
    %11 = add nsw <8 x i32> %10, %7
-  ;CHECK: cost of 1 {{.*}} store
+  ;CHECK: cost of 2 {{.*}} store
    store <8 x i32> %11, <8 x i32>* %9, align 4
    %index.next = add i64 %index, 8
    %12 = icmp eq i64 %index.next, %end.idx.rnd.down