Home | History | Annotate | Download | only in OpenMP
      1 // RUN: %clang_cc1 -fopenmp=libiomp5 -triple x86_64-unknown-unknown -emit-llvm %s -o - | FileCheck %s -check-prefix=CHECK -check-prefix=NORMAL
      2 // RUN: %clang_cc1 -fopenmp=libiomp5 -triple powerpc64-unknown-unknown -emit-llvm %s -o - | FileCheck %s -check-prefix=CHECK -check-prefix=NORMAL
      3 // RUN: %clang_cc1 -fopenmp=libiomp5 -triple powerpc64-unknown-unknown -target-abi elfv1-qpx -emit-llvm %s -o - | FileCheck %s -check-prefix=CHECK -check-prefix=QPX
      4 
      5 void h1(float *c, float *a, double b[], int size)
      6 {
      7 // CHECK-LABEL: define void @h1
      8   int t = 0;
      9 #pragma omp simd safelen(16) linear(t) aligned(c:32) aligned(a,b)
     10 // CHECK:         [[C_PTRINT:%.+]] = ptrtoint
     11 // CHECK-NEXT:    [[C_MASKEDPTR:%.+]] = and i{{[0-9]+}} [[C_PTRINT]], 31
     12 // CHECK-NEXT:    [[C_MASKCOND:%.+]] = icmp eq i{{[0-9]+}} [[C_MASKEDPTR]], 0
     13 // CHECK-NEXT:    call void @llvm.assume(i1 [[C_MASKCOND]])
     14 // CHECK:         [[A_PTRINT:%.+]] = ptrtoint
     15 // CHECK-NEXT:    [[A_MASKEDPTR:%.+]] = and i{{[0-9]+}} [[A_PTRINT]], 15
     16 // CHECK-NEXT:    [[A_MASKCOND:%.+]] = icmp eq i{{[0-9]+}} [[A_MASKEDPTR]], 0
     17 // CHECK-NEXT:    call void @llvm.assume(i1 [[A_MASKCOND]])
     18 // CHECK:         [[B_PTRINT:%.+]] = ptrtoint
     19 // NORMAL-NEXT:    [[B_MASKEDPTR:%.+]] = and i{{[0-9]+}} [[B_PTRINT]], 15
     20 // QPX-NEXT:    [[B_MASKEDPTR:%.+]] = and i{{[0-9]+}} [[B_PTRINT]], 31
     21 // CHECK-NEXT:    [[B_MASKCOND:%.+]] = icmp eq i{{[0-9]+}} [[B_MASKEDPTR]], 0
     22 // CHECK-NEXT:    call void @llvm.assume(i1 [[B_MASKCOND]])
     23   for (int i = 0; i < size; ++i) {
     24     c[i] = a[i] * a[i] + b[i] * b[t];
     25     ++t;
     26 // do not emit parallel_loop_access metadata due to usage of safelen clause.
     27 // CHECK-NOT: store float {{.+}}, float* {{.+}}, align {{.+}}, !llvm.mem.parallel_loop_access {{![0-9]+}}
     28   }
     29 }
     30 
     31 void h2(float *c, float *a, float *b, int size)
     32 {
     33 // CHECK-LABEL: define void @h2
     34   int t = 0;
     35 #pragma omp simd linear(t)
     36   for (int i = 0; i < size; ++i) {
     37     c[i] = a[i] * a[i] + b[i] * b[t];
     38     ++t;
     39 // CHECK: store float {{.+}}, float* {{.+}}, align {{.+}}, !llvm.mem.parallel_loop_access [[LOOP_H2_HEADER:![0-9]+]]
     40   }
     41 }
     42 
     43 void h3(float *c, float *a, float *b, int size)
     44 {
     45 // CHECK-LABEL: define void @h3
     46 #pragma omp simd
     47   for (int i = 0; i < size; ++i) {
     48     for (int j = 0; j < size; ++j) {
     49       c[j*i] = a[i] * b[j];
     50     }
     51   }
     52 // do not emit parallel_loop_access for nested loop.
     53 // CHECK-NOT: store float {{.+}}, float* {{.+}}, align {{.+}}, !llvm.mem.parallel_loop_access {{![0-9]+}}
     54 }
     55 
     56 // Metadata for h1:
     57 // CHECK: [[LOOP_H1_HEADER:![0-9]+]] = distinct !{[[LOOP_H1_HEADER]], [[LOOP_WIDTH_16:![0-9]+]], [[LOOP_VEC_ENABLE:![0-9]+]]}
     58 // CHECK: [[LOOP_WIDTH_16]] = !{!"llvm.loop.vectorize.width", i32 16}
     59 // CHECK: [[LOOP_VEC_ENABLE]] = !{!"llvm.loop.vectorize.enable", i1 true}
     60 //
     61 // Metadata for h2:
     62 // CHECK: [[LOOP_H2_HEADER]] = distinct !{[[LOOP_H2_HEADER]], [[LOOP_VEC_ENABLE]]}
     63 //
     64 // Metadata for h3:
     65 // CHECK: [[LOOP_H3_HEADER:![0-9]+]] = distinct !{[[LOOP_H3_HEADER]], [[LOOP_VEC_ENABLE]]}
     66 //
     67