Home | History | Annotate | Download | only in CodeGen
      1 // RUN: %clang_cc1 -triple x86_64-unknown-unknown -emit-llvm -o - %s| FileCheck %s
      2 // RUN: %clang_cc1 -triple x86_64-unknown-unknown -emit-llvm -o - %s -target-feature +avx | FileCheck %s -check-prefix=AVX
      3 #include <stdarg.h>
      4 
      5 // CHECK-LABEL: define signext i8 @f0()
      6 char f0(void) {
      7   return 0;
      8 }
      9 
     10 // CHECK-LABEL: define signext i16 @f1()
     11 short f1(void) {
     12   return 0;
     13 }
     14 
     15 // CHECK-LABEL: define i32 @f2()
     16 int f2(void) {
     17   return 0;
     18 }
     19 
     20 // CHECK-LABEL: define float @f3()
     21 float f3(void) {
     22   return 0;
     23 }
     24 
     25 // CHECK-LABEL: define double @f4()
     26 double f4(void) {
     27   return 0;
     28 }
     29 
     30 // CHECK-LABEL: define x86_fp80 @f5()
     31 long double f5(void) {
     32   return 0;
     33 }
     34 
     35 // CHECK-LABEL: define void @f6(i8 signext %a0, i16 signext %a1, i32 %a2, i64 %a3, i8* %a4)
     36 void f6(char a0, short a1, int a2, long long a3, void *a4) {
     37 }
     38 
     39 // CHECK-LABEL: define void @f7(i32 %a0)
     40 typedef enum { A, B, C } e7;
     41 void f7(e7 a0) {
     42 }
     43 
     44 // Test merging/passing of upper eightbyte with X87 class.
     45 //
     46 // CHECK-LABEL: define void @f8_1(%union.u8* noalias sret %agg.result)
     47 // CHECK-LABEL: define void @f8_2(%union.u8* byval align 16 %a0)
     48 union u8 {
     49   long double a;
     50   int b;
     51 };
     52 union u8 f8_1() { while (1) {} }
     53 void f8_2(union u8 a0) {}
     54 
     55 // CHECK-LABEL: define i64 @f9()
     56 struct s9 { int a; int b; int : 0; } f9(void) { while (1) {} }
     57 
     58 // CHECK-LABEL: define void @f10(i64 %a0.coerce)
     59 struct s10 { int a; int b; int : 0; };
     60 void f10(struct s10 a0) {}
     61 
     62 // CHECK-LABEL: define void @f11(%union.anon* noalias sret %agg.result)
     63 union { long double a; float b; } f11() { while (1) {} }
     64 
     65 // CHECK-LABEL: define i32 @f12_0()
     66 // CHECK-LABEL: define void @f12_1(i32 %a0.coerce)
     67 struct s12 { int a __attribute__((aligned(16))); };
     68 struct s12 f12_0(void) { while (1) {} }
     69 void f12_1(struct s12 a0) {}
     70 
     71 // Check that sret parameter is accounted for when checking available integer
     72 // registers.
     73 // CHECK: define void @f13(%struct.s13_0* noalias sret %agg.result, i32 %a, i32 %b, i32 %c, i32 %d, {{.*}}* byval align 8 %e, i32 %f)
     74 
     75 struct s13_0 { long long f0[3]; };
     76 struct s13_1 { long long f0[2]; };
     77 struct s13_0 f13(int a, int b, int c, int d,
     78                  struct s13_1 e, int f) { while (1) {} }
     79 
     80 // CHECK: define void @f14({{.*}}, i8 signext %X)
     81 void f14(int a, int b, int c, int d, int e, int f, char X) {}
     82 
     83 // CHECK: define void @f15({{.*}}, i8* %X)
     84 void f15(int a, int b, int c, int d, int e, int f, void *X) {}
     85 
     86 // CHECK: define void @f16({{.*}}, float %X)
     87 void f16(float a, float b, float c, float d, float e, float f, float g, float h,
     88          float X) {}
     89 
     90 // CHECK: define void @f17({{.*}}, x86_fp80 %X)
     91 void f17(float a, float b, float c, float d, float e, float f, float g, float h,
     92          long double X) {}
     93 
     94 // Check for valid coercion.  The struct should be passed/returned as i32, not
     95 // as i64 for better code quality.
     96 // rdar://8135035
     97 // CHECK-LABEL: define void @f18(i32 %a, i32 %f18_arg1.coerce)
     98 struct f18_s0 { int f0; };
     99 void f18(int a, struct f18_s0 f18_arg1) { while (1) {} }
    100 
    101 // Check byval alignment.
    102 
    103 // CHECK-LABEL: define void @f19(%struct.s19* byval align 16 %x)
    104 struct s19 {
    105   long double a;
    106 };
    107 void f19(struct s19 x) {}
    108 
    109 // CHECK-LABEL: define void @f20(%struct.s20* byval align 32 %x)
    110 struct __attribute__((aligned(32))) s20 {
    111   int x;
    112   int y;
    113 };
    114 void f20(struct s20 x) {}
    115 
    116 struct StringRef {
    117   long x;
    118   const char *Ptr;
    119 };
    120 
    121 // rdar://7375902
    122 // CHECK-LABEL: define i8* @f21(i64 %S.coerce0, i8* %S.coerce1)
    123 const char *f21(struct StringRef S) { return S.x+S.Ptr; }
    124 
    125 // PR7567
    126 typedef __attribute__ ((aligned(16))) struct f22s { unsigned long long x[2]; } L;
    127 void f22(L x, L y) { }
    128 // CHECK: @f22
    129 // CHECK: %x = alloca{{.*}}, align 16
    130 // CHECK: %y = alloca{{.*}}, align 16
    131 
    132 
    133 
    134 // PR7714
    135 struct f23S {
    136   short f0;
    137   unsigned f1;
    138   int f2;
    139 };
    140 
    141 
    142 void f23(int A, struct f23S B) {
    143   // CHECK-LABEL: define void @f23(i32 %A, i64 %B.coerce0, i32 %B.coerce1)
    144 }
    145 
    146 struct f24s { long a; int b; };
    147 
    148 struct f23S f24(struct f23S *X, struct f24s *P2) {
    149   return *X;
    150 
    151   // CHECK: define { i64, i32 } @f24(%struct.f23S* %X, %struct.f24s* %P2)
    152 }
    153 
    154 // rdar://8248065
    155 typedef float v4f32 __attribute__((__vector_size__(16)));
    156 v4f32 f25(v4f32 X) {
    157   // CHECK-LABEL: define <4 x float> @f25(<4 x float> %X)
    158   // CHECK-NOT: alloca
    159   // CHECK: alloca <4 x float>
    160   // CHECK-NOT: alloca
    161   // CHECK: store <4 x float> %X, <4 x float>*
    162   // CHECK-NOT: store
    163   // CHECK: ret <4 x float>
    164   return X+X;
    165 }
    166 
    167 struct foo26 {
    168   int *X;
    169   float *Y;
    170 };
    171 
    172 struct foo26 f26(struct foo26 *P) {
    173   // CHECK: define { i32*, float* } @f26(%struct.foo26* %P)
    174   return *P;
    175 }
    176 
    177 
    178 struct v4f32wrapper {
    179   v4f32 v;
    180 };
    181 
    182 struct v4f32wrapper f27(struct v4f32wrapper X) {
    183   // CHECK-LABEL: define <4 x float> @f27(<4 x float> %X.coerce)
    184   return X;
    185 }
    186 
    187 // PR22563 - We should unwrap simple structs and arrays to pass
    188 // and return them in the appropriate vector registers if possible.
    189 
    190 typedef float v8f32 __attribute__((__vector_size__(32)));
    191 struct v8f32wrapper {
    192   v8f32 v;
    193 };
    194 
    195 struct v8f32wrapper f27a(struct v8f32wrapper X) {
    196   // AVX-LABEL: define <8 x float> @f27a(<8 x float> %X.coerce)
    197   return X;
    198 }
    199 
    200 struct v8f32wrapper_wrapper {
    201   v8f32 v[1];
    202 };
    203 
    204 struct v8f32wrapper_wrapper f27b(struct v8f32wrapper_wrapper X) {
    205   // AVX-LABEL: define <8 x float> @f27b(<8 x float> %X.coerce)
    206   return X;
    207 }
    208 
    209 // rdar://5711709
    210 struct f28c {
    211   double x;
    212   int y;
    213 };
    214 void f28(struct f28c C) {
    215   // CHECK-LABEL: define void @f28(double %C.coerce0, i32 %C.coerce1)
    216 }
    217 
    218 struct f29a {
    219   struct c {
    220     double x;
    221     int y;
    222   } x[1];
    223 };
    224 
    225 void f29a(struct f29a A) {
    226   // CHECK-LABEL: define void @f29a(double %A.coerce0, i32 %A.coerce1)
    227 }
    228 
    229 // rdar://8249586
    230 struct S0 { char f0[8]; char f2; char f3; char f4; };
    231 void f30(struct S0 p_4) {
    232   // CHECK-LABEL: define void @f30(i64 %p_4.coerce0, i24 %p_4.coerce1)
    233 }
    234 
    235 // Pass the third element as a float when followed by tail padding.
    236 // rdar://8251384
    237 struct f31foo { float a, b, c; };
    238 float f31(struct f31foo X) {
    239   // CHECK-LABEL: define float @f31(<2 x float> %X.coerce0, float %X.coerce1)
    240   return X.c;
    241 }
    242 
    243 _Complex float f32(_Complex float A, _Complex float B) {
    244   // rdar://6379669
    245   // CHECK-LABEL: define <2 x float> @f32(<2 x float> %A.coerce, <2 x float> %B.coerce)
    246   return A+B;
    247 }
    248 
    249 
    250 // rdar://8357396
    251 struct f33s { long x; float c,d; };
    252 
    253 void f33(va_list X) {
    254   va_arg(X, struct f33s);
    255 }
    256 
    257 typedef unsigned long long v1i64 __attribute__((__vector_size__(8)));
    258 
    259 // rdar://8359248
    260 // CHECK-LABEL: define i64 @f34(i64 %arg.coerce)
    261 v1i64 f34(v1i64 arg) { return arg; }
    262 
    263 
    264 // rdar://8358475
    265 // CHECK-LABEL: define i64 @f35(i64 %arg.coerce)
    266 typedef unsigned long v1i64_2 __attribute__((__vector_size__(8)));
    267 v1i64_2 f35(v1i64_2 arg) { return arg+arg; }
    268 
    269 // rdar://9122143
    270 // CHECK: declare void @func(%struct._str* byval align 16)
    271 typedef struct _str {
    272   union {
    273     long double a;
    274     long c;
    275   };
    276 } str;
    277 
    278 void func(str s);
    279 str ss;
    280 void f9122143()
    281 {
    282   func(ss);
    283 }
    284 
    285 // CHECK-LABEL: define double @f36(double %arg.coerce)
    286 typedef unsigned v2i32 __attribute((__vector_size__(8)));
    287 v2i32 f36(v2i32 arg) { return arg; }
    288 
    289 // AVX: declare void @f38(<8 x float>)
    290 // AVX: declare void @f37(<8 x float>)
    291 // CHECK: declare void @f38(%struct.s256* byval align 32)
    292 // CHECK: declare void @f37(<8 x float>* byval align 32)
    293 typedef float __m256 __attribute__ ((__vector_size__ (32)));
    294 typedef struct {
    295   __m256 m;
    296 } s256;
    297 
    298 s256 x38;
    299 __m256 x37;
    300 
    301 void f38(s256 x);
    302 void f37(__m256 x);
    303 void f39() { f38(x38); f37(x37); }
    304 
    305 // The two next tests make sure that the struct below is passed
    306 // in the same way regardless of avx being used
    307 
    308 // CHECK: declare void @func40(%struct.t128* byval align 16)
    309 typedef float __m128 __attribute__ ((__vector_size__ (16)));
    310 typedef struct t128 {
    311   __m128 m;
    312   __m128 n;
    313 } two128;
    314 
    315 extern void func40(two128 s);
    316 void func41(two128 s) {
    317   func40(s);
    318 }
    319 
    320 // CHECK: declare void @func42(%struct.t128_2* byval align 16)
    321 typedef struct xxx {
    322   __m128 array[2];
    323 } Atwo128;
    324 typedef struct t128_2 {
    325   Atwo128 x;
    326 } SA;
    327 
    328 extern void func42(SA s);
    329 void func43(SA s) {
    330   func42(s);
    331 }
    332 
    333 // CHECK-LABEL: define i32 @f44
    334 // CHECK: ptrtoint
    335 // CHECK-NEXT: and {{.*}}, -32
    336 // CHECK-NEXT: inttoptr
    337 typedef int T44 __attribute((vector_size(32)));
    338 struct s44 { T44 x; int y; };
    339 int f44(int i, ...) {
    340   __builtin_va_list ap;
    341   __builtin_va_start(ap, i);
    342   struct s44 s = __builtin_va_arg(ap, struct s44);
    343   __builtin_va_end(ap);
    344   return s.y;
    345 }
    346 
    347 // Text that vec3 returns the correct LLVM IR type.
    348 // AVX-LABEL: define i32 @foo(<3 x i64> %X)
    349 typedef long long3 __attribute((ext_vector_type(3)));
    350 int foo(long3 X)
    351 {
    352   return 0;
    353 }
    354 
    355 // Make sure we don't use a varargs convention for a function without a
    356 // prototype where AVX types are involved.
    357 // AVX: @test45
    358 // AVX: call i32 bitcast (i32 (...)* @f45 to i32 (<8 x float>)*)
    359 int f45();
    360 __m256 x45;
    361 void test45() { f45(x45); }
    362 
    363 // Make sure we use byval to pass 64-bit vectors in memory; the LLVM call
    364 // lowering can't handle this case correctly because it runs after legalization.
    365 // CHECK: @test46
    366 // CHECK: call void @f46({{.*}}<2 x float>* byval align 8 {{.*}}, <2 x float>* byval align 8 {{.*}})
    367 typedef float v46 __attribute((vector_size(8)));
    368 void f46(v46,v46,v46,v46,v46,v46,v46,v46,v46,v46);
    369 void test46() { v46 x = {1,2}; f46(x,x,x,x,x,x,x,x,x,x); }
    370 
    371 // Check that we pass the struct below without using byval, which helps out
    372 // codegen.
    373 //
    374 // CHECK: @test47
    375 // CHECK: call void @f47(i32 {{.*}}, i32 {{.*}}, i32 {{.*}}, i32 {{.*}}, i32 {{.*}}, i32 {{.*}}, i32 {{.*}})
    376 struct s47 { unsigned a; };
    377 void f47(int,int,int,int,int,int,struct s47);
    378 void test47(int a, struct s47 b) { f47(a, a, a, a, a, a, b); }
    379 
    380 // rdar://12723368
    381 // In the following example, there are holes in T4 at the 3rd byte and the 4th
    382 // byte, however, T2 does not have those holes. T4 is chosen to be the
    383 // representing type for union T1, but we can't use load or store of T4 since
    384 // it will skip the 3rd byte and the 4th byte.
    385 // In general, Since we don't accurately represent the data fields of a union,
    386 // do not use load or store of the representing llvm type for the union.
    387 typedef _Complex int T2;
    388 typedef _Complex char T5;
    389 typedef _Complex int T7;
    390 typedef struct T4 { T5 field0; T7 field1; } T4;
    391 typedef union T1 { T2 field0; T4 field1; } T1;
    392 extern T1 T1_retval;
    393 T1 test48(void) {
    394 // CHECK: @test48
    395 // CHECK: memcpy
    396 // CHECK: memcpy
    397   return T1_retval;
    398 }
    399 
    400 void test49_helper(double, ...);
    401 void test49(double d, double e) {
    402   test49_helper(d, e);
    403 }
    404 // CHECK-LABEL:    define void @test49(
    405 // CHECK:      [[T0:%.*]] = load double, double*
    406 // CHECK-NEXT: [[T1:%.*]] = load double, double*
    407 // CHECK-NEXT: call void (double, ...) @test49_helper(double [[T0]], double [[T1]])
    408 
    409 void test50_helper();
    410 void test50(double d, double e) {
    411   test50_helper(d, e);
    412 }
    413 // CHECK-LABEL:    define void @test50(
    414 // CHECK:      [[T0:%.*]] = load double, double*
    415 // CHECK-NEXT: [[T1:%.*]] = load double, double*
    416 // CHECK-NEXT: call void (double, double, ...) bitcast (void (...)* @test50_helper to void (double, double, ...)*)(double [[T0]], double [[T1]])
    417 
    418 struct test51_s { __uint128_t intval; };
    419 void test51(struct test51_s *s, __builtin_va_list argList) {
    420     *s = __builtin_va_arg(argList, struct test51_s);
    421 }
    422 
    423 // CHECK-LABEL: define void @test51
    424 // CHECK: [[TMP_ADDR:%.*]] = alloca [[STRUCT_TEST51:%.*]], align 16
    425 // CHECK: br i1
    426 // CHECK: [[REG_SAVE_AREA_PTR:%.*]] = getelementptr inbounds {{.*}}, i32 0, i32 3
    427 // CHECK-NEXT: [[REG_SAVE_AREA:%.*]] = load i8*, i8** [[REG_SAVE_AREA_PTR]]
    428 // CHECK-NEXT: [[VALUE_ADDR:%.*]] = getelementptr i8, i8* [[REG_SAVE_AREA]], i32 {{.*}}
    429 // CHECK-NEXT: [[CASTED_VALUE_ADDR:%.*]] = bitcast i8* [[VALUE_ADDR]] to [[STRUCT_TEST51]]
    430 // CHECK-NEXT: [[CASTED_TMP_ADDR:%.*]] = bitcast [[STRUCT_TEST51]]* [[TMP_ADDR]] to i8*
    431 // CHECK-NEXT: [[RECASTED_VALUE_ADDR:%.*]] = bitcast [[STRUCT_TEST51]]* [[CASTED_VALUE_ADDR]] to i8*
    432 // CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* [[CASTED_TMP_ADDR]], i8* [[RECASTED_VALUE_ADDR]], i64 16, i32 8, i1 false)
    433 // CHECK-NEXT: add i32 {{.*}}, 16
    434 // CHECK-NEXT: store i32 {{.*}}, i32* {{.*}}
    435 // CHECK-NEXT: br label
    436 
    437 void test52_helper(int, ...);
    438 __m256 x52;
    439 void test52() {
    440   test52_helper(0, x52, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0i);
    441 }
    442 // AVX: @test52_helper(i32 0, <8 x float> {{%[a-zA-Z0-9]+}}, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double {{%[a-zA-Z0-9]+}}, double {{%[a-zA-Z0-9]+}})
    443 
    444 void test53(__m256 *m, __builtin_va_list argList) {
    445   *m = __builtin_va_arg(argList, __m256);
    446 }
    447 // AVX-LABEL: define void @test53
    448 // AVX-NOT: br i1
    449 // AVX: ret void
    450 
    451 void test54_helper(__m256, ...);
    452 __m256 x54;
    453 void test54() {
    454   test54_helper(x54, x54, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0i);
    455   test54_helper(x54, x54, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0i);
    456 }
    457 // AVX: @test54_helper(<8 x float> {{%[a-zA-Z0-9]+}}, <8 x float> {{%[a-zA-Z0-9]+}}, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double {{%[a-zA-Z0-9]+}}, double {{%[a-zA-Z0-9]+}})
    458 // AVX: @test54_helper(<8 x float> {{%[a-zA-Z0-9]+}}, <8 x float> {{%[a-zA-Z0-9]+}}, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, double 1.000000e+00, { double, double }* byval align 8 {{%[a-zA-Z0-9]+}})
    459