test/Analysis/DependenceAnalysis/NonCanonicalizedSubscript.ll

   1 ; RUN: opt < %s -analyze -basicaa -da -da-delinearize=false | FileCheck %s
   2 ; RUN: opt < %s -analyze -basicaa -da -da-delinearize | FileCheck %s -check-prefix=DELIN
   3
   4 target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
   5 target triple = "x86_64-apple-macosx10.6.0"
   6
   7 ; for (int i = 0; i < 100; ++i) {
   8 ;   int t0 = a[i][i];
   9 ;   int t1 = t0 + 1;
  10 ;   a[i][5] = t1;
  11 ; }
  12 ; The subscript 5 in a[i][5] is deliberately an i32, mismatching the i64 type
  13 ; of the other subscripts. DependenceAnalysis before the fix crashed due to
  14 ; this mismatch.
  15 define void @i32_subscript([100 x [100 x i32]]* %a, i32* %b) { ; single-loop case; %b is never referenced in the body
  16 ; CHECK-LABEL: 'Dependence Analysis' for function 'i32_subscript'
  17 ; DELIN-LABEL: 'Dependence Analysis' for function 'i32_subscript'
  18 entry:
  19   br label %for.body
  20
  21 for.body:
  22 ; CHECK: da analyze - none!
  23 ; CHECK: da analyze - anti [=|<]!
  24 ; CHECK: da analyze - none!
  25 ; DELIN: da analyze - none!
  26 ; DELIN: da analyze - anti [=|<]!
  27 ; DELIN: da analyze - none!
  28   %i = phi i64 [ 0, %entry ], [ %i.inc, %for.body ] ; loop counter i, 0 on entry
  29   %a.addr = getelementptr [100 x [100 x i32]], [100 x [100 x i32]]* %a, i64 0, i64 %i, i64 %i ; &a[i][i], every index is i64
  30   %a.addr.2 = getelementptr [100 x [100 x i32]], [100 x [100 x i32]]* %a, i64 0, i64 %i, i32 5 ; &a[i][5], last index is intentionally i32
  31   %0 = load i32, i32* %a.addr, align 4 ; t0 = a[i][i]
  32   %1 = add i32 %0, 1 ; t1 = t0 + 1
  33   store i32 %1, i32* %a.addr.2, align 4 ; a[i][5] = t1
  34   %i.inc = add nsw i64 %i, 1 ; ++i
  35   %exitcond = icmp ne i64 %i.inc, 100 ; true while the incremented counter != 100
  36   br i1 %exitcond, label %for.body, label %for.end ; back edge while %exitcond holds
  37
  38 for.end:
  39   ret void
  40 }
  41
  42 target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128" ; NOTE(review): second datalayout declaration in this file (another appears near the top) - confirm which one is intended
  43 target triple = "x86_64-unknown-linux-gnu" ; NOTE(review): second triple declaration; differs from the earlier x86_64-apple-macosx10.6.0 - confirm
  44
  45 ;  unsigned i, j;
  46 ;  for (i = 1; i < SIZE; i++) {
  47 ;    for (j = i; j < SIZE; j++) {
  48 ;      a[i][j] = a[i+1][j-1] + 2;
  49 ;    }
  50 ;  }
  51 ;  Extends the previous example to coupled MIV subscripts.
  52
  53
  54 @a = global [10004 x [10004 x i32]] zeroinitializer, align 16 ; zero-initialized 2-D i32 array indexed by @coupled_miv_type_mismatch
  55
  56 ; Function Attrs: nounwind uwtable
  57 define void @coupled_miv_type_mismatch(i32 %n) #0 { ; two-level loop nest over @a; %n is never referenced in the body
  58 ; CHECK-LABEL: 'Dependence Analysis' for function 'coupled_miv_type_mismatch'
  59 ; DELIN-LABEL: 'Dependence Analysis' for function 'coupled_miv_type_mismatch'
  60 entry:
  61   br label %for.cond
  62
  63 ; CHECK: da analyze - input [0 *]!
  64 ; CHECK: da analyze - anti [1 *]!
  65 ; CHECK: da analyze - none!
  66 ; DELIN: da analyze - input [0 *]!
  67 ; DELIN: da analyze - anti [1 *]!
  68 ; DELIN: da analyze - none!
  69 for.cond:                                         ; preds = %for.inc11, %entry
  70   %indvars.iv11 = phi i64 [ %indvars.iv.next12, %for.inc11 ], [ 1, %entry ] ; outer counter i as i64, 1 on entry
  71   %exitcond14 = icmp ne i64 %indvars.iv11, 10000 ; true while i != 10000
  72   br i1 %exitcond14, label %for.cond1.preheader, label %for.end13 ; enter inner loop or leave the nest
  73
  74 for.cond1.preheader:                              ; preds = %for.cond
  75   %0 = trunc i64 %indvars.iv11 to i32 ; i narrowed to i32, initial value of %j.0
  76   br label %for.cond1
  77
  78 for.cond1:                                        ; preds = %for.cond1.preheader, %for.body3
  79   %indvars.iv8 = phi i64 [ %indvars.iv11, %for.cond1.preheader ], [ %indvars.iv.next9, %for.body3 ] ; inner counter j as i64, starts at i
  80   %j.0 = phi i32 [ %inc, %for.body3 ], [ %0, %for.cond1.preheader ] ; parallel i32 copy of j, starts at trunc(i)
  81   %lftr.wideiv = trunc i64 %indvars.iv8 to i32 ; i32 view of the i64 counter for the exit test
  82   %exitcond = icmp ne i32 %lftr.wideiv, 10000 ; true while (i32)j != 10000
  83   br i1 %exitcond, label %for.body3, label %for.inc11 ; run the body or advance the outer loop
  84
  85 for.body3:                                        ; preds = %for.cond1
  86   %sub = add nsw i32 %j.0, -1 ; j - 1, computed in i32
  87   %idxprom = zext i32 %sub to i64 ; widened to i64 so it can index @a next to i64 subscripts
  88   %1 = add nuw nsw i64 %indvars.iv11, 1 ; i + 1
  89   %arrayidx5 = getelementptr inbounds [10004 x [10004 x i32]], [10004 x [10004 x i32]]* @a, i64 0, i64 %1, i64 %idxprom ; &a[i+1][j-1], column comes from the i32 counter
  90   %2 = load i32, i32* %arrayidx5, align 4 ; read a[i+1][j-1]
  91   %add6 = add nsw i32 %2, 2 ; + 2
  92   %arrayidx10 = getelementptr inbounds [10004 x [10004 x i32]], [10004 x [10004 x i32]]* @a, i64 0, i64 %indvars.iv11, i64 %indvars.iv8 ; &a[i][j], both subscripts are i64 counters
  93   store i32 %add6, i32* %arrayidx10, align 4 ; a[i][j] = a[i+1][j-1] + 2
  94   %indvars.iv.next9 = add nuw nsw i64 %indvars.iv8, 1 ; advance the i64 j
  95   %inc = add nuw nsw i32 %j.0, 1 ; advance the i32 j in step with it
  96   br label %for.cond1
  97
  98 for.inc11:                                        ; preds = %for.cond1
  99   %indvars.iv.next12 = add nuw nsw i64 %indvars.iv11, 1 ; i++
 100   br label %for.cond
 101
 102 for.end13:                                        ; preds = %for.cond
 103   ret void
 104 }
 105
 106 attributes #0 = { nounwind uwtable "less-precise-fpmad"="false" "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+sse,+sse2" "unsafe-fp-math"="false" "use-soft-float"="false" } ; attribute group attached to @coupled_miv_type_mismatch
 107
 108 !llvm.ident = !{!0}
 109
 110 !0 = !{!"clang version 3.7.0 (https://vaivaswatha@bitbucket.org/compilertree/amd_clang.git 93a05fb75ee3411d24e8b2b184fc766a5318403e) (https://vaivaswatha@bitbucket.org/compilertree/amd_llvm.git 166d93d26efc912b517739f64d054a435e8e95cd)"}