1 ; RUN: opt < %s -analyze -basicaa -da -da-delinearize=false | FileCheck %s
2 ; RUN: opt < %s -analyze -basicaa -da -da-delinearize | FileCheck %s -check-prefix=DELIN
4 target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
5 target triple = "x86_64-apple-macosx10.6.0"
7 ; for (int i = 0; i < 100; ++i) {
12 ; The subscript 5 in a[i][5] is deliberately an i32, mismatching the types of
13 ; the other subscripts. DependenceAnalysis before the fix crashed due to this
; Single-loop test function: it loads a[i][i] and stores to a[i][5]. The
; constant subscript 5 is typed i32, whereas every other GEP index is i64.
15 define void @i32_subscript([100 x [100 x i32]]* %a, i32* %b) {
16 ; CHECK-LABEL: 'Dependence Analysis' for function 'i32_subscript'
17 ; DELIN-LABEL: 'Dependence Analysis' for function 'i32_subscript'
; Expected analyzer output, matched in order. The same three results are
; expected with delinearization disabled and enabled.
22 ; CHECK: da analyze - none!
23 ; CHECK: da analyze - anti [=|<]!
24 ; CHECK: da analyze - none!
25 ; DELIN: da analyze - none!
26 ; DELIN: da analyze - anti [=|<]!
27 ; DELIN: da analyze - none!
; Loop induction variable: 0 on entry, %i.inc on the back edge.
28 %i = phi i64 [ 0, %entry ], [ %i.inc, %for.body ]
; Address of a[i][i]; all indices are i64.
29 %a.addr = getelementptr [100 x [100 x i32]], [100 x [100 x i32]]* %a, i64 0, i64 %i, i64 %i
; Address of a[i][5]; the last index is an i32 constant, unlike the i64 indices
; used everywhere else. This is the type mismatch under test.
30 %a.addr.2 = getelementptr [100 x [100 x i32]], [100 x [100 x i32]]* %a, i64 0, i64 %i, i32 5
; Read a[i][i].
31 %0 = load i32, i32* %a.addr, align 4
; Write %1 to a[i][5].
33 store i32 %1, i32* %a.addr.2, align 4
; Advance the induction variable and keep looping until it reaches 100.
34 %i.inc = add nsw i64 %i, 1
35 %exitcond = icmp ne i64 %i.inc, 100
36 br i1 %exitcond, label %for.body, label %for.end
42 target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
43 target triple = "x86_64-unknown-linux-gnu"
46 ; for (i = 1; i < SIZE; i++) {
47 ; for (j = i; j < SIZE; j++) {
48 ; a[i][j] = a[i+1][j-1] + 2;
51 ; Extends the previous example to coupled MIV subscripts.
; Zero-initialised 10004 x 10004 array of i32; both address computations in
; @coupled_miv_type_mismatch index into it.
54 @a = global [10004 x [10004 x i32]] zeroinitializer, align 16
56 ; Function Attrs: nounwind uwtable
; Two-level loop nest over the global @a: it loads a[i+1][j-1], adds 2, and
; stores the result to a[i][j]. The load's column subscript is computed in i32
; and zero-extended to i64, while the store's subscripts are i64 induction
; variables used directly.
57 define void @coupled_miv_type_mismatch(i32 %n) #0 {
58 ; CHECK-LABEL: 'Dependence Analysis' for function 'coupled_miv_type_mismatch'
59 ; DELIN-LABEL: 'Dependence Analysis' for function 'coupled_miv_type_mismatch'
; Expected analyzer output, matched in order. The same three results are
; expected with delinearization disabled and enabled.
63 ; CHECK: da analyze - input [0 *]!
64 ; CHECK: da analyze - anti [1 *]!
65 ; CHECK: da analyze - none!
66 ; DELIN: da analyze - input [0 *]!
67 ; DELIN: da analyze - anti [1 *]!
68 ; DELIN: da analyze - none!
69 for.cond: ; preds = %for.inc11, %entry
; Outer induction variable (i64): 1 on entry, %indvars.iv.next12 on the back edge.
70 %indvars.iv11 = phi i64 [ %indvars.iv.next12, %for.inc11 ], [ 1, %entry ]
; Leave the outer loop once the induction variable equals 10000.
71 %exitcond14 = icmp ne i64 %indvars.iv11, 10000
72 br i1 %exitcond14, label %for.cond1.preheader, label %for.end13
74 for.cond1.preheader: ; preds = %for.cond
; i32 copy of the outer induction variable; it seeds %j.0 below.
75 %0 = trunc i64 %indvars.iv11 to i32
78 for.cond1: ; preds = %for.cond1.preheader, %for.body3
; Inner induction variable (i64), starting from the outer variable's current value.
79 %indvars.iv8 = phi i64 [ %indvars.iv11, %for.cond1.preheader ], [ %indvars.iv.next9, %for.body3 ]
; i32 twin of the inner induction variable; it feeds the j-1 subscript of the load.
80 %j.0 = phi i32 [ %inc, %for.body3 ], [ %0, %for.cond1.preheader ]
; The inner exit test truncates the i64 induction variable and compares it with 10000.
81 %lftr.wideiv = trunc i64 %indvars.iv8 to i32
82 %exitcond = icmp ne i32 %lftr.wideiv, 10000
83 br i1 %exitcond, label %for.body3, label %for.inc11
85 for.body3: ; preds = %for.cond1
; j-1 is computed in i32 and then zero-extended to form the i64 column subscript.
86 %sub = add nsw i32 %j.0, -1
87 %idxprom = zext i32 %sub to i64
; Row subscript i+1.
88 %1 = add nuw nsw i64 %indvars.iv11, 1
; Address of a[i+1][j-1], then the load from it.
89 %arrayidx5 = getelementptr inbounds [10004 x [10004 x i32]], [10004 x [10004 x i32]]* @a, i64 0, i64 %1, i64 %idxprom
90 %2 = load i32, i32* %arrayidx5, align 4
91 %add6 = add nsw i32 %2, 2
; Address of a[i][j], using the i64 induction variables directly, then the store.
92 %arrayidx10 = getelementptr inbounds [10004 x [10004 x i32]], [10004 x [10004 x i32]]* @a, i64 0, i64 %indvars.iv11, i64 %indvars.iv8
93 store i32 %add6, i32* %arrayidx10, align 4
; Advance both the i64 and the i32 inner induction variables.
94 %indvars.iv.next9 = add nuw nsw i64 %indvars.iv8, 1
95 %inc = add nuw nsw i32 %j.0, 1
98 for.inc11: ; preds = %for.cond1
; Advance the outer induction variable.
99 %indvars.iv.next12 = add nuw nsw i64 %indvars.iv11, 1
102 for.end13: ; preds = %for.cond
106 attributes #0 = { nounwind uwtable "less-precise-fpmad"="false" "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+sse,+sse2" "unsafe-fp-math"="false" "use-soft-float"="false" }
110 !0 = !{!"clang version 3.7.0 (https://vaivaswatha@bitbucket.org/compilertree/amd_clang.git 93a05fb75ee3411d24e8b2b184fc766a5318403e) (https://vaivaswatha@bitbucket.org/compilertree/amd_llvm.git 166d93d26efc912b517739f64d054a435e8e95cd)"}