Home | History | Annotate | Download | only in NVPTX
      1 ; RUN: opt < %s -nary-reassociate -early-cse -S | FileCheck %s
      2 
      3 target datalayout = "e-i64:64-v16:16-v32:32-n16:32:64"
      4 target triple = "nvptx64-unknown-unknown"
      5 
        ; Declared here without a body; every test function below passes the
        ; addresses it computes to @foo.
      6 declare void @foo(float*)
      7 
      8 ; foo(&a[i]);
      9 ; foo(&a[i + j]);
     10 ;   =>
     11 ; t = &a[i];
     12 ; foo(t);
     13 ; foo(t + j);
        ;
        ; Baseline case with i64 indices. The second GEP is indexed by %i + %j
        ; and the first GEP already computes &a[%i], so the expected output
        ; rebases the second GEP onto the first with the leftover index %j.
     14 define void @reassociate_gep(float* %a, i64 %i, i64 %j) {
     15 ; CHECK-LABEL: @reassociate_gep(
     16   %1 = add i64 %i, %j
          ; &a[i]: captured as t1 by the pattern on the next check line.
     17   %2 = getelementptr float, float* %a, i64 %i
     18 ; CHECK: [[t1:[^ ]+]] = getelementptr float, float* %a, i64 %i
     19   call void @foo(float* %2)
     20 ; CHECK: call void @foo(float* [[t1]])
          ; &a[i + j]: expected to be rewritten as t1 + j.
     21   %3 = getelementptr float, float* %a, i64 %1
     22 ; CHECK: [[t2:[^ ]+]] = getelementptr float, float* [[t1]], i64 %j
     23   call void @foo(float* %3)
     24 ; CHECK: call void @foo(float* [[t2]])
     25   ret void
     26 }
     27 
     28 ; foo(&a[sext(j)]);
     29 ; foo(&a[sext(i +nsw j)]);
     30 ; foo(&a[sext((i +nsw j) +nsw i)]);
     31 ;   =>
     32 ; t1 = &a[sext(j)];
     33 ; foo(t1);
     34 ; t2 = t1 + sext(i);
     35 ; foo(t2);
     36 ; t3 = t2 + sext(i); // the sext(i) from t2 should be reused (pipeline runs -early-cse).
     37 ; foo(t3);
        ;
        ; i32 indices are added with nsw and then sign-extended to i64 before
        ; being used as GEP indices. The expected output chains the three
        ; addresses (t1 -> t2 -> t3) and uses one shared sext of %i for both
        ; of the rewritten GEPs.
     38 define void @reassociate_gep_nsw(float* %a, i32 %i, i32 %j) {
     39 ; CHECK-LABEL: @reassociate_gep_nsw(
          ; t1 = &a[sext(j)]
     40   %idxprom.j = sext i32 %j to i64
     41   %1 = getelementptr float, float* %a, i64 %idxprom.j
     42 ; CHECK: [[t1:[^ ]+]] = getelementptr float, float* %a, i64 %idxprom.j
     43   call void @foo(float* %1)
     44 ; CHECK: call void @foo(float* [[t1]])
     45 
          ; &a[sext(i +nsw j)]: expected to become t1 + sext(i).
     46   %2 = add nsw i32 %i, %j
     47   %idxprom.2 = sext i32 %2 to i64
     48   %3 = getelementptr float, float* %a, i64 %idxprom.2
     49 ; CHECK: [[sexti:[^ ]+]] = sext i32 %i to i64
     50 ; CHECK: [[t2:[^ ]+]] = getelementptr float, float* [[t1]], i64 [[sexti]]
     51   call void @foo(float* %3)
     52 ; CHECK: call void @foo(float* [[t2]])
     53 
          ; &a[sext((i +nsw j) +nsw i)]: expected to become t2 + sext(i), using
          ; the same sext value that was matched for t2.
     54   %4 = add nsw i32 %2, %i
     55   %idxprom.4 = sext i32 %4 to i64
     56   %5 = getelementptr float, float* %a, i64 %idxprom.4
     57 ; CHECK: [[t3:[^ ]+]] = getelementptr float, float* [[t2]], i64 [[sexti]]
     58   call void @foo(float* %5)
     59 ; CHECK: call void @foo(float* [[t3]])
     60 
     61   ret void
     62 }
     63 
     64 ; assume(j >= 0);
     65 ; foo(&a[zext(j)]);
     66 ; assume(i + j >= 0);
     67 ; foo(&a[zext(i + j)]);
     68 ;   =>
     69 ; t1 = &a[zext(j)];
     70 ; foo(t1);
     71 ; t2 = t1 + sext(i);
     72 ; foo(t2);
        ;
        ; Variant of the nsw test where the add carries no nsw flag and the
        ; indices are zero-extended. The only sign information in the input is
        ; the pair of llvm.assume calls stating that %j and %i + %j are greater
        ; than -1. The expected output still rebases the second GEP onto the
        ; first, with a sign-extended %i as the index.
        ; NOTE(review): presumably the assumes are what make this rewrite
        ; legal; confirm against the pass implementation.
     73 define void @reassociate_gep_assume(float* %a, i32 %i, i32 %j) {
     74 ; CHECK-LABEL: @reassociate_gep_assume(
     75   ; assume(j >= 0)
     76   %cmp = icmp sgt i32 %j, -1
     77   call void @llvm.assume(i1 %cmp)
          ; assume(i + j >= 0); both assumes are emitted before the first GEP.
     78   %1 = add i32 %i, %j
     79   %cmp2 = icmp sgt i32 %1, -1
     80   call void @llvm.assume(i1 %cmp2)
     81 
          ; t1 = &a[zext(j)]
     82   %idxprom.j = zext i32 %j to i64
     83   %2 = getelementptr float, float* %a, i64 %idxprom.j
     84 ; CHECK: [[t1:[^ ]+]] = getelementptr float, float* %a, i64 %idxprom.j
     85   call void @foo(float* %2)
     86 ; CHECK: call void @foo(float* [[t1]])
     87 
          ; &a[zext(i + j)]: expected to become t1 + sext(i).
     88   %idxprom.1 = zext i32 %1 to i64
     89   %3 = getelementptr float, float* %a, i64 %idxprom.1
     90 ; CHECK: [[sexti:[^ ]+]] = sext i32 %i to i64
     91 ; CHECK: [[t2:[^ ]+]] = getelementptr float, float* [[t1]], i64 [[sexti]]
     92   call void @foo(float* %3)
     93 ; CHECK: call void @foo(float* [[t2]])
     94 
     95   ret void
     96 }
     97 
     98 ; Do not split the second GEP because sext(i + j) != sext(i) + sext(j).
        ;
        ; Negative test: the i32 add has no nsw flag and the function contains
        ; no assumes, and the i32 values are used directly as GEP indices. Both
        ; GEPs are expected to survive unchanged, still based on %a.
     99 define void @reassociate_gep_no_nsw(float* %a, i32 %i, i32 %j) {
    100 ; CHECK-LABEL: @reassociate_gep_no_nsw(
    101   %1 = add i32 %i, %j
    102   %2 = getelementptr float, float* %a, i32 %j
    103 ; CHECK: getelementptr float, float* %a, i32 %j
    104   call void @foo(float* %2)
          ; Must keep %a as the base and the unsplit sum %1 as the index.
    105   %3 = getelementptr float, float* %a, i32 %1
    106 ; CHECK: getelementptr float, float* %a, i32 %1
    107   call void @foo(float* %3)
    108   ret void
    109 }
    110 
        ; Same shape as @reassociate_gep, but with i128 indices. The expected
        ; output rebases the second GEP onto the first and feeds it %j
        ; truncated from i128 to i64.
        ; NOTE(review): presumably i64 is the pointer index width for this
        ; target; confirm against the datalayout rules.
    111 define void @reassociate_gep_128(float* %a, i128 %i, i128 %j) {
    112 ; CHECK-LABEL: @reassociate_gep_128(
    113   %1 = add i128 %i, %j
          ; &a[i]: left as written, still indexed with the i128 value.
    114   %2 = getelementptr float, float* %a, i128 %i
    115 ; CHECK: [[t1:[^ ]+]] = getelementptr float, float* %a, i128 %i
    116   call void @foo(float* %2)
    117 ; CHECK: call void @foo(float* [[t1]])
          ; &a[i + j]: expected to become t1 + trunc(j).
    118   %3 = getelementptr float, float* %a, i128 %1
    119 ; CHECK: [[truncj:[^ ]+]] = trunc i128 %j to i64
    120 ; CHECK: [[t2:[^ ]+]] = getelementptr float, float* [[t1]], i64 [[truncj]]
    121   call void @foo(float* %3)
    122 ; CHECK: call void @foo(float* [[t2]])
    123   ret void
    124 }
    125 
    126 %struct.complex = type { float, float }
    127 
        ; Declared without a body; @different_types passes it a pointer to a
        ; whole %struct.complex element.
    128 declare void @bar(%struct.complex*)
    129 
        ; The two GEPs have different result types: %t1 is a %struct.complex*
        ; to input[i], while %t2 is a float* to field 0 of input[i + 5].
        ; Because %struct.complex holds two floats, the expected output
        ; bitcasts %t1 to float* and indexes it by the constant 10 (5 elements
        ; times 2 floats each). The bitcast, the new GEP and the call to @foo
        ; must appear on consecutive output lines.
    130 define void @different_types(%struct.complex* %input, i64 %i) {
    131 ; CHECK-LABEL: @different_types(
          ; &input[i]
    132   %t1 = getelementptr %struct.complex, %struct.complex* %input, i64 %i
    133   call void @bar(%struct.complex* %t1)
          ; &input[i + 5].0 (first float of the element)
    134   %j = add i64 %i, 5
    135   %t2 = getelementptr %struct.complex, %struct.complex* %input, i64 %j, i32 0
    136 ; CHECK: [[cast:[^ ]+]] = bitcast %struct.complex* %t1 to float*
    137 ; CHECK-NEXT: %t2 = getelementptr float, float* [[cast]], i64 10
    138 ; CHECK-NEXT: call void @foo(float* %t2)
    139   call void @foo(float* %t2)
    140   ret void
    141 }
    142 
        ; Intrinsic called by @reassociate_gep_assume to state its two
        ; "greater than -1" conditions.
    143 declare void @llvm.assume(i1)
    144