Home | History | Annotate | Download | only in CodeGen
      1 // RUN: %clang_cc1 %s -emit-llvm -o - -triple=armv7-apple-ios -std=c11 | FileCheck %s
      2 
      3 // There isn't really anything special about iOS; it just happens to
      4 // only deploy on processors with native atomics support, so it's a good
      5 // way to test those code-paths.
      6 
      7 // This work was done in pursuit of <rdar://13338582>.
      8 
      9 // CHECK: define arm_aapcscc void @testFloat(float*
        // testFloat: pins the IR emitted for an _Atomic(float), both through the
        // pointer parameter fp and as a local. Each source statement below is
        // preceded by the FileCheck directives describing the IR expected for it,
        // so statement order and directive order must stay in lockstep.
     10 void testFloat(_Atomic(float) *fp) {
     11 // CHECK:      [[FP:%.*]] = alloca float*
     12 // CHECK-NEXT: [[X:%.*]] = alloca float
     13 // CHECK-NEXT: [[F:%.*]] = alloca float
     14 // CHECK-NEXT: store float* {{%.*}}, float** [[FP]]
     15 
        // Initialization via __c11_atomic_init is expected as an ordinary
        // (non-atomic) float store through the loaded pointer.
     16 // CHECK-NEXT: [[T0:%.*]] = load float** [[FP]]
     17 // CHECK-NEXT: store float 1.000000e+00, float* [[T0]], align 4
     18   __c11_atomic_init(fp, 1.0f);
     19 
        // Initializing a local atomic is likewise expected as a plain store.
     20 // CHECK-NEXT: store float 2.000000e+00, float* [[X]], align 4
     21   _Atomic(float) x = 2.0f;
     22 
        // An implicit atomic read is expected as a seq_cst atomic i32 load
        // through a bitcast pointer, with the result bitcast back to float.
     23 // CHECK-NEXT: [[T0:%.*]] = load float** [[FP]]
     24 // CHECK-NEXT: [[T1:%.*]] = bitcast float* [[T0]] to i32*
     25 // CHECK-NEXT: [[T2:%.*]] = load atomic i32* [[T1]] seq_cst, align 4
     26 // CHECK-NEXT: [[T3:%.*]] = bitcast i32 [[T2]] to float
     27 // CHECK-NEXT: store float [[T3]], float* [[F]]
     28   float f = *fp;
     29 
        // An implicit atomic write is expected as the mirror image: bitcast the
        // float value to i32 and emit a seq_cst atomic i32 store.
     30 // CHECK-NEXT: [[T0:%.*]] = load float* [[F]], align 4
     31 // CHECK-NEXT: [[T1:%.*]] = load float** [[FP]], align 4
     32 // CHECK-NEXT: [[T2:%.*]] = bitcast float [[T0]] to i32
     33 // CHECK-NEXT: [[T3:%.*]] = bitcast float* [[T1]] to i32*
     34 // CHECK-NEXT: store atomic i32 [[T2]], i32* [[T3]] seq_cst, align 4
     35   *fp = f;
     36 
     37 // CHECK-NEXT: ret void
     38 }
     39 
     40 // CHECK: define arm_aapcscc void @testComplexFloat([[CF:{ float, float }]]*
        // testComplexFloat: pins the IR emitted for an _Atomic(_Complex float),
        // which the directives expect to be represented as { float, float } and
        // accessed atomically as a single i64. The atomic local and the two
        // temporaries are expected with align 8; the plain _Complex float local
        // is expected with align 4.
     41 void testComplexFloat(_Atomic(_Complex float) *fp) {
     42 // CHECK:      [[FP:%.*]] = alloca [[CF]]*, align 4
     43 // CHECK-NEXT: [[X:%.*]] = alloca [[CF]], align 8
     44 // CHECK-NEXT: [[F:%.*]] = alloca [[CF]], align 4
     45 // CHECK-NEXT: [[TMP0:%.*]] = alloca [[CF]], align 8
     46 // CHECK-NEXT: [[TMP1:%.*]] = alloca [[CF]], align 8
     47 // CHECK-NEXT: store [[CF]]*
     48 
        // Initialization from the scalar 1.0f is expected as two plain stores:
        // real part 1.0 and imaginary part 0.0.
     49 // CHECK-NEXT: [[P:%.*]] = load [[CF]]** [[FP]]
     50 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]]* [[P]], i32 0, i32 0
     51 // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[CF]]* [[P]], i32 0, i32 1
     52 // CHECK-NEXT: store float 1.000000e+00, float* [[T0]]
     53 // CHECK-NEXT: store float 0.000000e+00, float* [[T1]]
     54   __c11_atomic_init(fp, 1.0f);
     55 
        // Same shape for the local atomic: element-wise plain stores.
     56 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]]* [[X]], i32 0, i32 0
     57 // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[CF]]* [[X]], i32 0, i32 1
     58 // CHECK-NEXT: store float 2.000000e+00, float* [[T0]]
     59 // CHECK-NEXT: store float 0.000000e+00, float* [[T1]]
     60   _Atomic(_Complex float) x = 2.0f;
     61 
        // Atomic read: one seq_cst i64 load, spilled to the first temporary,
        // then the real and imaginary parts are read back out and copied into f.
     62 // CHECK-NEXT: [[T0:%.*]] = load [[CF]]** [[FP]]
     63 // CHECK-NEXT: [[T1:%.*]] = bitcast [[CF]]* [[T0]] to i64*
     64 // CHECK-NEXT: [[T2:%.*]] = load atomic i64* [[T1]] seq_cst, align 8
     65 // CHECK-NEXT: [[T3:%.*]] = bitcast [[CF]]* [[TMP0]] to i64*
     66 // CHECK-NEXT: store i64 [[T2]], i64* [[T3]], align 8
     67 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]]* [[TMP0]], i32 0, i32 0
     68 // CHECK-NEXT: [[R:%.*]] = load float* [[T0]]
     69 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]]* [[TMP0]], i32 0, i32 1
     70 // CHECK-NEXT: [[I:%.*]] = load float* [[T0]]
     71 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]]* [[F]], i32 0, i32 0
     72 // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[CF]]* [[F]], i32 0, i32 1
     73 // CHECK-NEXT: store float [[R]], float* [[T0]]
     74 // CHECK-NEXT: store float [[I]], float* [[T1]]
     75   _Complex float f = *fp;
     76 
        // Atomic write: the parts of f are assembled in the second temporary,
        // reloaded as an i64, and written with one seq_cst atomic i64 store.
     77 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]]* [[F]], i32 0, i32 0
     78 // CHECK-NEXT: [[R:%.*]] = load float* [[T0]]
     79 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]]* [[F]], i32 0, i32 1
     80 // CHECK-NEXT: [[I:%.*]] = load float* [[T0]]
     81 // CHECK-NEXT: [[DEST:%.*]] = load [[CF]]** [[FP]], align 4
     82 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[CF]]* [[TMP1]], i32 0, i32 0
     83 // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[CF]]* [[TMP1]], i32 0, i32 1
     84 // CHECK-NEXT: store float [[R]], float* [[T0]]
     85 // CHECK-NEXT: store float [[I]], float* [[T1]]
     86 // CHECK-NEXT: [[T0:%.*]] = bitcast [[CF]]* [[TMP1]] to i64*
     87 // CHECK-NEXT: [[T1:%.*]] = load i64* [[T0]], align 8
     88 // CHECK-NEXT: [[T2:%.*]] = bitcast [[CF]]* [[DEST]] to i64*
     89 // CHECK-NEXT: store atomic i64 [[T1]], i64* [[T2]] seq_cst, align 8
     90   *fp = f;
     91 
     92 // CHECK-NEXT: ret void
     93 }
     94 
     95 typedef struct { short x, y, z, w; } S;
        // testStruct: pins the IR emitted for an _Atomic struct of four shorts.
        // The directives expect the atomic object to use the same IR type as the
        // plain struct (captured as S) and to be read and written atomically as
        // a single i64. The atomic local and the temporary are expected with
        // align 8, the plain local f with align 2.
     96 // CHECK: define arm_aapcscc void @testStruct([[S:.*]]*
     97 void testStruct(_Atomic(S) *fp) {
     98 // CHECK:      [[FP:%.*]] = alloca [[S]]*, align 4
     99 // CHECK-NEXT: [[X:%.*]] = alloca [[S]], align 8
        // NOTE(review): the next directive re-captures S with a fresh pattern
        // instead of reusing the earlier capture -- confirm this is intended.
    100 // CHECK-NEXT: [[F:%.*]] = alloca [[S:%.*]], align 2
    101 // CHECK-NEXT: [[TMP0:%.*]] = alloca [[S]], align 8
    102 // CHECK-NEXT: store [[S]]*
    103 
        // Initialization from a compound literal is expected as four plain
        // i16 stores, one per field, directly into the pointee.
    104 // CHECK-NEXT: [[P:%.*]] = load [[S]]** [[FP]]
    105 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]]* [[P]], i32 0, i32 0
    106 // CHECK-NEXT: store i16 1, i16* [[T0]], align 2
    107 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]]* [[P]], i32 0, i32 1
    108 // CHECK-NEXT: store i16 2, i16* [[T0]], align 2
    109 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]]* [[P]], i32 0, i32 2
    110 // CHECK-NEXT: store i16 3, i16* [[T0]], align 2
    111 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]]* [[P]], i32 0, i32 3
    112 // CHECK-NEXT: store i16 4, i16* [[T0]], align 2
    113   __c11_atomic_init(fp, (S){1,2,3,4});
    114 
        // Same field-by-field plain stores for the local atomic.
    115 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]]* [[X]], i32 0, i32 0
    116 // CHECK-NEXT: store i16 1, i16* [[T0]], align 2
    117 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]]* [[X]], i32 0, i32 1
    118 // CHECK-NEXT: store i16 2, i16* [[T0]], align 2
    119 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]]* [[X]], i32 0, i32 2
    120 // CHECK-NEXT: store i16 3, i16* [[T0]], align 2
    121 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[S]]* [[X]], i32 0, i32 3
    122 // CHECK-NEXT: store i16 4, i16* [[T0]], align 2
    123   _Atomic(S) x = (S){1,2,3,4};
    124 
        // Atomic read: a seq_cst i64 load whose result is stored straight into
        // f (no temporary), using f's own 2-byte alignment.
    125 // CHECK-NEXT: [[T0:%.*]] = load [[S]]** [[FP]]
    126 // CHECK-NEXT: [[T1:%.*]] = bitcast [[S]]* [[T0]] to i64*
    127 // CHECK-NEXT: [[T2:%.*]] = load atomic i64* [[T1]] seq_cst, align 8
    128 // CHECK-NEXT: [[T3:%.*]] = bitcast [[S]]* [[F]] to i64*
    129 // CHECK-NEXT: store i64 [[T2]], i64* [[T3]], align 2
    130   S f = *fp;
    131 
        // Atomic write: f is first copied (8 bytes, align 2) into the 8-aligned
        // temporary, which is then reloaded as an i64 and stored atomically.
    132 // CHECK-NEXT: [[T0:%.*]] = load [[S]]** [[FP]]
    133 // CHECK-NEXT: [[T1:%.*]] = bitcast [[S]]* [[TMP0]] to i8*
    134 // CHECK-NEXT: [[T2:%.*]] = bitcast [[S]]* [[F]] to i8*
    135 // CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[T1]], i8* [[T2]], i32 8, i32 2, i1 false)
    136 // CHECK-NEXT: [[T3:%.*]] = bitcast [[S]]* [[TMP0]] to i64*
    137 // CHECK-NEXT: [[T4:%.*]] = load i64* [[T3]], align 8
    138 // CHECK-NEXT: [[T5:%.*]] = bitcast [[S]]* [[T0]] to i64*
    139 // CHECK-NEXT: store atomic i64 [[T4]], i64* [[T5]] seq_cst, align 8
    140   *fp = f;
    141 
    142 // CHECK-NEXT: ret void
    143 }
    144 
    145 typedef struct { short x, y, z; } PS;
        // testPromotedStruct: pins the IR emitted for an _Atomic struct of three
        // shorts. The directives expect the atomic type (captured as APS) to
        // differ from the plain struct type (captured as PS); one directive below
        // spells it out as { %struct.PS, [2 x i8] }. Atomic accesses are expected
        // as single seq_cst i64 operations, with the padded object zeroed by
        // memset before its fields are written.
    146 // CHECK: define arm_aapcscc void @testPromotedStruct([[APS:.*]]*
    147 void testPromotedStruct(_Atomic(PS) *fp) {
    148 // CHECK:      [[FP:%.*]] = alloca [[APS]]*, align 4
    149 // CHECK-NEXT: [[X:%.*]] = alloca [[APS]], align 8
    150 // CHECK-NEXT: [[F:%.*]] = alloca [[PS:%.*]], align 2
    151 // CHECK-NEXT: [[TMP0:%.*]] = alloca [[APS]], align 8
    152 // CHECK-NEXT: [[TMP1:%.*]] = alloca [[APS]], align 8
    153 // CHECK-NEXT: store [[APS]]*
    154 
        // Initialization: zero all 8 bytes of the pointee, then store the three
        // fields through element 0 of the padded wrapper.
        // NOTE(review): this memset is expected with an i64 length (.i64
        // variant), whereas the two later memsets in this function use the .i32
        // variant -- confirm the difference is intentional.
    155 // CHECK-NEXT: [[P:%.*]] = load [[APS]]** [[FP]]
    156 // CHECK-NEXT: [[T0:%.*]] = bitcast [[APS]]* [[P]] to i8*
    157 // CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* [[T0]], i8 0, i64 8, i32 8, i1 false)
    158 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[APS]]* [[P]], i32 0, i32 0
    159 // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[PS]]* [[T0]], i32 0, i32 0
    160 // CHECK-NEXT: store i16 1, i16* [[T1]], align 2
    161 // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[PS]]* [[T0]], i32 0, i32 1
    162 // CHECK-NEXT: store i16 2, i16* [[T1]], align 2
    163 // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[PS]]* [[T0]], i32 0, i32 2
    164 // CHECK-NEXT: store i16 3, i16* [[T1]], align 2
    165   __c11_atomic_init(fp, (PS){1,2,3});
    166 
        // Local atomic: same zero-then-fill sequence, applied to the alloca.
    167 // CHECK-NEXT: [[T0:%.*]] = bitcast [[APS]]* [[X]] to i8*
    168 // CHECK-NEXT: call void @llvm.memset.p0i8.i32(i8* [[T0]], i8 0, i32 8, i32 8, i1 false)
    169 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[APS]]* [[X]], i32 0, i32 0
    170 // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[PS]]* [[T0]], i32 0, i32 0
    171 // CHECK-NEXT: store i16 1, i16* [[T1]], align 2
    172 // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[PS]]* [[T0]], i32 0, i32 1
    173 // CHECK-NEXT: store i16 2, i16* [[T1]], align 2
    174 // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[PS]]* [[T0]], i32 0, i32 2
    175 // CHECK-NEXT: store i16 3, i16* [[T1]], align 2
    176   _Atomic(PS) x = (PS){1,2,3};
    177 
        // Atomic read: seq_cst i64 load into the first temporary, then only the
        // 6 bytes of the inner struct are copied out into f.
    178 // CHECK-NEXT: [[T0:%.*]] = load [[APS]]** [[FP]]
    179 // CHECK-NEXT: [[T1:%.*]] = bitcast [[APS]]* [[T0]] to i64*
    180 // CHECK-NEXT: [[T2:%.*]] = load atomic i64* [[T1]] seq_cst, align 8
    181 // CHECK-NEXT: [[T3:%.*]] = bitcast [[APS]]* [[TMP0]] to i64*
    182 // CHECK-NEXT: store i64 [[T2]], i64* [[T3]], align 2
    183 // CHECK-NEXT: [[T0:%.*]] = getelementptr inbounds [[APS]]* [[TMP0]], i32 0, i32 0
    184 // CHECK-NEXT: [[T1:%.*]] = bitcast [[PS]]* [[F]] to i8*
    185 // CHECK-NEXT: [[T2:%.*]] = bitcast [[PS]]* [[T0]] to i8*
    186 // CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[T1]], i8* [[T2]], i32 6, i32 2, i1 false)
    187   PS f = *fp;
    188 
        // Atomic write: zero the second temporary, copy the 6 bytes of f into
        // its inner struct, reload all 8 bytes as an i64 and store atomically.
        // NOTE(review): the bitcast directive below writes the padded type out
        // literally rather than through the APS capture used everywhere else.
    189 // CHECK-NEXT: [[T0:%.*]] = load [[APS]]** [[FP]]
    190 // CHECK-NEXT: [[T1:%.*]] = bitcast { %struct.PS, [2 x i8] }* [[TMP1]] to i8*
    191 // CHECK-NEXT: call void @llvm.memset.p0i8.i32(i8* [[T1]], i8 0, i32 8, i32 8, i1 false)
    192 // CHECK-NEXT: [[T1:%.*]] = getelementptr inbounds [[APS]]* [[TMP1]], i32 0, i32 0
    193 // CHECK-NEXT: [[T2:%.*]] = bitcast [[PS]]* [[T1]] to i8*
    194 // CHECK-NEXT: [[T3:%.*]] = bitcast [[PS]]* [[F]] to i8*
    195 // CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i32(i8* [[T2]], i8* [[T3]], i32 6, i32 2, i1 false)
    196 // CHECK-NEXT: [[T4:%.*]] = bitcast [[APS]]* [[TMP1]] to i64*
    197 // CHECK-NEXT: [[T5:%.*]] = load i64* [[T4]], align 8
    198 // CHECK-NEXT: [[T6:%.*]] = bitcast [[APS]]* [[T0]] to i64*
    199 // CHECK-NEXT: store atomic i64 [[T5]], i64* [[T6]] seq_cst, align 8
    200   *fp = f;
    201 
    202 // CHECK-NEXT: ret void
    203 }
    204 
    205 void testPromotedStructOps(_Atomic(PS) *p) {
        // Exercises the explicit __c11_atomic_* builtins (load, store, exchange,
        // strong and weak compare-exchange) on the three-short atomic struct PS.
        // No FileCheck directives accompany this function in the visible source;
        // presumably it only has to get through code generation cleanly --
        // TODO confirm.
        // The literal 5 passed as every memory-order argument is the numeric
        // value of memory_order_seq_cst (__ATOMIC_SEQ_CST) in Clang.
    206   PS a = __c11_atomic_load(p, 5);
    207   __c11_atomic_store(p, a, 5);
    208   PS b = __c11_atomic_exchange(p, a, 5);
    209 
        // Both compare-exchange forms use b as the expected value and a as the
        // desired value; the weak form's result overwrites the strong form's.
    210   _Bool v = __c11_atomic_compare_exchange_strong(p, &b, a, 5, 5);
    211   v = __c11_atomic_compare_exchange_weak(p, &b, a, 5, 5);
    212 }
    213