Home | History | Annotate | Download | only in LoopAccessAnalysis
      1 ; RUN: opt -basicaa -loop-accesses -analyze < %s | FileCheck %s
      2 
      3 target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128"
      4 
      5 ; i and i + 1 can overflow in the following kernel:
      6 ; void test1(unsigned long long x, int *a, int *b) {
      7 ;  for (unsigned i = 0; i < x; ++i)
      8 ;    b[i] = a[i+1] + 1;
      9 ; }
     10 ;
     11 ; If accesses to a and b can alias, we need to emit a run-time alias check
     12 ; between accesses to a and b. However, when i and i + 1 can wrap, their
     13 ; SCEV expression is not an AddRec. We need to create SCEV predicates and
     14 ; coerce the expressions to AddRecs in order to be able to emit the run-time
     15 ; alias check.
     16 ;
     17 ; The accesses at b[i] and a[i+1] correspond to the addresses %arrayidx and
     18 ; %arrayidx4 in the test. The SCEV expressions for these are:
     19 ;  ((4 * (zext i32 {1,+,1}<%for.body> to i64))<nuw><nsw> + %a)<nsw>
     20 ;  ((4 * (zext i32 {0,+,1}<%for.body> to i64))<nuw><nsw> + %b)<nsw>
     21 ;
     22 ; The transformed expressions are:
     23 ;  i64 {(4 + %a),+,4}<%for.body>
     24 ;  i64 {(4 + %b),+,4}<%for.body>
     25 
     26 ; CHECK-LABEL: test1
     27 ; CHECK:         Memory dependences are safe with run-time checks
     28 ; CHECK-NEXT:    Dependences:
     29 ; CHECK-NEXT:    Run-time memory checks:
     30 ; CHECK-NEXT:    Check 0:
     31 ; CHECK-NEXT:      Comparing group
     32 ; CHECK-NEXT:        %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
     33 ; CHECK-NEXT:      Against group
     34 ; CHECK-NEXT:        %arrayidx4 = getelementptr inbounds i32, i32* %b, i64 %conv11
     35 ; CHECK-NEXT:    Grouped accesses:
     36 ; CHECK-NEXT:      Group
     37 ; CHECK-NEXT:        (Low: (4 + %a) High: (4 + (4 * (1 umax %x)) + %a))
     38 ; CHECK-NEXT:          Member: {(4 + %a),+,4}<%for.body>
     39 ; CHECK-NEXT:      Group
     40 ; CHECK-NEXT:        (Low: %b High: ((4 * (1 umax %x)) + %b))
     41 ; CHECK-NEXT:          Member: {%b,+,4}<%for.body>
     42 ; CHECK:         Store to invariant address was not found in loop.
     43 ; CHECK-NEXT:    SCEV assumptions:
     44 ; CHECK-NEXT:    {1,+,1}<%for.body> Added Flags: <nusw>
     45 ; CHECK-NEXT:    {0,+,1}<%for.body> Added Flags: <nusw>
     46 ; CHECK:         Expressions re-written:
     47 ; CHECK-NEXT:    [PSE]  %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom:
     48 ; CHECK-NEXT:      ((4 * (zext i32 {1,+,1}<%for.body> to i64))<nuw><nsw> + %a)<nsw>
     49 ; CHECK-NEXT:      --> {(4 + %a),+,4}<%for.body>
     50 ; CHECK-NEXT:    [PSE]  %arrayidx4 = getelementptr inbounds i32, i32* %b, i64 %conv11:
     51 ; CHECK-NEXT:      ((4 * (zext i32 {0,+,1}<%for.body> to i64))<nuw><nsw> + %b)<nsw>
     52 ; CHECK-NEXT:      --> {%b,+,4}<%for.body>
     53 define void @test1(i64 %x, i32* %a, i32* %b) {
     54 entry:
     55   br label %for.body
     56 
     57 for.body:                                         ; preds = %for.body.preheader, %for.body
     58   %conv11 = phi i64 [ %conv, %for.body ], [ 0, %entry ]
     59   %i.010 = phi i32 [ %add, %for.body ], [ 0, %entry ]
     60   %add = add i32 %i.010, 1
     61   %idxprom = zext i32 %add to i64
     62   %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
     63   %ld = load i32, i32* %arrayidx, align 4
     64   %add2 = add nsw i32 %ld, 1
     65   %arrayidx4 = getelementptr inbounds i32, i32* %b, i64 %conv11
     66   store i32 %add2, i32* %arrayidx4, align 4
     67   %conv = zext i32 %add to i64
     68   %cmp = icmp ult i64 %conv, %x
     69   br i1 %cmp, label %for.body, label %exit
     70 
     71 exit:
     72   ret void
     73 }
     74 
     75 ; i can overflow in the following kernel:
     76 ; void test2(unsigned long long x, int *a) {
     77 ;   for (unsigned i = 0; i < x; ++i)
     78 ;     a[i] = a[i] + 1;
     79 ; }
     80 ;
     81 ; We need to check that i doesn't wrap, but we don't need a run-time alias
     82 ; check. We also need an extra no-wrap check to get the backedge taken count.
     83 
     84 ; CHECK-LABEL: test2
     85 ; CHECK: Memory dependences are safe
     86 ; CHECK: SCEV assumptions:
     87 ; CHECK-NEXT:   {1,+,1}<%for.body> Added Flags: <nusw>
     88 ; CHECK-NEXT:   {0,+,1}<%for.body> Added Flags: <nusw>
     89  define void @test2(i64 %x, i32* %a) {
     90 entry:
     91   br label %for.body
     92 
     93 for.body:
     94   %conv11 = phi i64 [ %conv, %for.body ], [ 0, %entry ]
     95   %i.010 = phi i32 [ %inc, %for.body ], [ 0, %entry ]
     96   %arrayidx = getelementptr inbounds i32, i32* %a, i64 %conv11
     97   %ld = load i32, i32* %arrayidx, align 4
     98   %add = add nsw i32 %ld, 1
     99   store i32 %add, i32* %arrayidx, align 4
    100   %inc = add i32 %i.010, 1
    101   %conv = zext i32 %inc to i64
    102   %cmp = icmp ult i64 %conv, %x
    103   br i1 %cmp, label %for.body, label %exit
    104 
    105 exit:
    106   ret void
    107 }
    108