Home | History | Annotate | Download | only in DependenceAnalysis
      1 ; RUN: opt < %s -analyze -basicaa -da -da-delinearize=false | FileCheck %s
      2 ; RUN: opt < %s -analyze -basicaa -da -da-delinearize | FileCheck %s -check-prefix=DELIN
      3 
      4 target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
      5 target triple = "x86_64-apple-macosx10.6.0"
      6 
      7 ; for (int i = 0; i < 100; ++i) {
      8 ;   int t0 = a[i][i];
      9 ;   int t1 = t0 + 1;
     10 ;   a[i][5] = t1;
     11 ; }
     12 ; The subscript 5 in a[i][5] is deliberately an i32, mismatching the type of
     13 ; the other subscripts. Before the fix, DependenceAnalysis crashed on this
     14 ; mismatch.
     15 define void @i32_subscript([100 x [100 x i32]]* %a, i32* %b) {  ; single loop doing a[i][5] = a[i][i] + 1 for i in [0, 100); %b is not referenced in the body
     16 ; CHECK-LABEL: 'Dependence Analysis' for function 'i32_subscript'
     17 ; DELIN-LABEL: 'Dependence Analysis' for function 'i32_subscript'
     18 entry:
     19   br label %for.body
     20 
     21 for.body:
     22 ; CHECK: da analyze - none!
     23 ; CHECK: da analyze - anti [=|<]!
     24 ; CHECK: da analyze - none!
     25 ; DELIN: da analyze - none!
     26 ; DELIN: da analyze - anti [=|<]!
     27 ; DELIN: da analyze - none!
     28   %i = phi i64 [ 0, %entry ], [ %i.inc, %for.body ]  ; i starts at 0 and takes %i.inc on the back edge
     29   %a.addr = getelementptr [100 x [100 x i32]], [100 x [100 x i32]]* %a, i64 0, i64 %i, i64 %i  ; &a[i][i], every index is i64
     30   %a.addr.2 = getelementptr [100 x [100 x i32]], [100 x [100 x i32]]* %a, i64 0, i64 %i, i32 5  ; &a[i][5], last index is i32 rather than i64
     31   %0 = load i32, i32* %a.addr, align 4  ; t0 = a[i][i]
     32   %1 = add i32 %0, 1  ; t1 = t0 + 1
     33   store i32 %1, i32* %a.addr.2, align 4  ; a[i][5] = t1
     34   %i.inc = add nsw i64 %i, 1  ; ++i
     35   %exitcond = icmp ne i64 %i.inc, 100  ; true while the incremented i differs from 100
     36   br i1 %exitcond, label %for.body, label %for.end  ; loop back until the incremented i equals 100
     37 
     38 for.end:
     39   ret void
     40 }
     41 
     42 target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
     43 target triple = "x86_64-unknown-linux-gnu"
     44 
     45 ;  unsigned i, j;
     46 ;  for (i = 1; i < SIZE; i++) {
     47 ;    for (j = i; j < SIZE; j++) {
     48 ;      a[i][j] = a[i+1][j-1] + 2;
     49 ;    }
     50 ;  }
     51 ;  Extends the previous example to coupled MIV subscripts.
     52 
     53 
     54 @a = global [10004 x [10004 x i32]] zeroinitializer, align 16  ; zero-initialized 10004 x 10004 i32 array, loaded from and stored to by @coupled_miv_type_mismatch
     55 
     56 ; Function Attrs: nounwind uwtable
     57 define void @coupled_miv_type_mismatch(i32 %n) #0 {  ; nested loops doing a[i][j] = a[i+1][j-1] + 2 on global @a; %n is not referenced in the body
     58 ; CHECK-LABEL: 'Dependence Analysis' for function 'coupled_miv_type_mismatch'
     59 ; DELIN-LABEL: 'Dependence Analysis' for function 'coupled_miv_type_mismatch'
     60 entry:
     61   br label %for.cond
     62 
     63 ; CHECK: da analyze - input [0 *]!
     64 ; CHECK: da analyze - anti [1 *]!
     65 ; CHECK: da analyze - none!
     66 ; DELIN: da analyze - input [0 *]!
     67 ; DELIN: da analyze - anti [1 *]!
     68 ; DELIN: da analyze - none!
     69 for.cond:                                         ; preds = %for.inc11, %entry
     70   %indvars.iv11 = phi i64 [ %indvars.iv.next12, %for.inc11 ], [ 1, %entry ]  ; outer counter i (i64), starts at 1
     71   %exitcond14 = icmp ne i64 %indvars.iv11, 10000  ; outer loop continues while i != 10000
     72   br i1 %exitcond14, label %for.cond1.preheader, label %for.end13
     73 
     74 for.cond1.preheader:                              ; preds = %for.cond
     75   %0 = trunc i64 %indvars.iv11 to i32  ; i truncated to 32 bits, seeds the 32-bit j below
     76   br label %for.cond1
     77 
     78 for.cond1:                                        ; preds = %for.cond1.preheader, %for.body3
     79   %indvars.iv8 = phi i64 [ %indvars.iv11, %for.cond1.preheader ], [ %indvars.iv.next9, %for.body3 ]  ; 64-bit inner counter, starts at i
     80   %j.0 = phi i32 [ %inc, %for.body3 ], [ %0, %for.cond1.preheader ]  ; 32-bit inner counter j, starts at trunc(i)
     81   %lftr.wideiv = trunc i64 %indvars.iv8 to i32  ; 32-bit view of the 64-bit inner counter
     82   %exitcond = icmp ne i32 %lftr.wideiv, 10000  ; inner loop continues while that value != 10000
     83   br i1 %exitcond, label %for.body3, label %for.inc11
     84 
     85 for.body3:                                        ; preds = %for.cond1
     86   %sub = add nsw i32 %j.0, -1  ; j - 1, computed in i32
     87   %idxprom = zext i32 %sub to i64  ; widened to i64 with zext so it can be used as a GEP index
     88   %1 = add nuw nsw i64 %indvars.iv11, 1  ; i + 1
     89   %arrayidx5 = getelementptr inbounds [10004 x [10004 x i32]], [10004 x [10004 x i32]]* @a, i64 0, i64 %1, i64 %idxprom  ; &a[i+1][j-1]
     90   %2 = load i32, i32* %arrayidx5, align 4  ; read a[i+1][j-1]
     91   %add6 = add nsw i32 %2, 2  ; loaded value + 2
     92   %arrayidx10 = getelementptr inbounds [10004 x [10004 x i32]], [10004 x [10004 x i32]]* @a, i64 0, i64 %indvars.iv11, i64 %indvars.iv8  ; &a[i][j], both subscripts taken from the 64-bit counters
     93   store i32 %add6, i32* %arrayidx10, align 4  ; a[i][j] = a[i+1][j-1] + 2
     94   %indvars.iv.next9 = add nuw nsw i64 %indvars.iv8, 1  ; advance the 64-bit inner counter
     95   %inc = add nuw nsw i32 %j.0, 1  ; advance the 32-bit j by the same step
     96   br label %for.cond1
     97 
     98 for.inc11:                                        ; preds = %for.cond1
     99   %indvars.iv.next12 = add nuw nsw i64 %indvars.iv11, 1  ; ++i
    100   br label %for.cond
    101 
    102 for.end13:                                        ; preds = %for.cond
    103   ret void
    104 }
    105 
    106 attributes #0 = { nounwind uwtable "less-precise-fpmad"="false" "no-frame-pointer-elim"="true" "no-frame-pointer-elim-non-leaf" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "target-cpu"="x86-64" "target-features"="+sse,+sse2" "unsafe-fp-math"="false" "use-soft-float"="false" }
    107 
    108 !llvm.ident = !{!0}
    109 
    110 !0 = !{!"clang version 3.7.0 (https://vaivaswatha@bitbucket.org/compilertree/amd_clang.git 93a05fb75ee3411d24e8b2b184fc766a5318403e) (https://vaivaswatha@bitbucket.org/compilertree/amd_llvm.git 166d93d26efc912b517739f64d054a435e8e95cd)"}
    111