Home | History | Annotate | Download | only in X86
      1 ; RUN: llc < %s -mattr=-avx -fast-isel -mcpu=core2 -O0 -regalloc=fast -asm-verbose=0 -fast-isel-abort=1 | FileCheck %s
      2 ; RUN: llc < %s -mattr=+avx -fast-isel -mcpu=core2 -O0 -regalloc=fast -asm-verbose=0 -fast-isel-abort=1 | FileCheck %s --check-prefix=AVX
      3 
      4 target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64"
      5 target triple = "x86_64-apple-darwin10.0.0"
      6 
      7 ; Make sure that fast-isel folds the immediate into the binop even though it
      8 ; is non-canonical (the constant 8 is the left-hand operand of the 'and').
      9 define i32 @test1(i32 %i) nounwind ssp {
     10   %and = and i32 8, %i  ; constant deliberately placed on the left-hand side
     11   ret i32 %and
     12 }
     13 
     14 ; CHECK-LABEL: test1:
     15 ; CHECK: andl	$8, 
     16 
     17 
     18 ; rdar://9289512 - The load should fold into the compare (the expected cmpq below takes the stack slot as its memory operand).
     19 define void @test2(i64 %x) nounwind ssp {
     20 entry:
     21   %x.addr = alloca i64, align 8  ; stack slot that %x is spilled to
     22   store i64 %x, i64* %x.addr, align 8
     23   %tmp = load i64, i64* %x.addr, align 8  ; only use is the icmp on the next line
     24   %cmp = icmp sgt i64 %tmp, 42
     25   br i1 %cmp, label %if.then, label %if.end
     26 
     27 if.then:                                          ; preds = %entry
     28   br label %if.end
     29 
     30 if.end:                                           ; preds = %if.then, %entry
     31   ret void
     32 ; CHECK-LABEL: test2:
     33 ; CHECK: movq	%rdi, -8(%rsp)
     34 ; CHECK: cmpq	$42, -8(%rsp)
     35 }
     36 
     37 
     38 
     39 
     40 @G = external global i32  ; defined in another module; the expected output reaches it through the GOT
     41 define i64 @test3() nounwind {  ; returns the address of @G as an integer
     42   %A = ptrtoint i32* @G to i64  ; pointer-to-integer cast of a global address
     43   ret i64 %A
     44 ; CHECK-LABEL: test3:
     45 ; CHECK: movq _G@GOTPCREL(%rip), %rax
     46 ; CHECK-NEXT: ret
     47 }
     48 
     49 
     50 
     51 ; rdar://9289558 - zero-extending byte load from an indexed element of an external array.
     52 @rtx_length = external global [153 x i8]
     53 
     54 define i32 @test4(i64 %idxprom9) nounwind {
     55   %arrayidx10 = getelementptr inbounds [153 x i8], [153 x i8]* @rtx_length, i32 0, i64 %idxprom9
     56   %tmp11 = load i8, i8* %arrayidx10, align 1  ; byte at @rtx_length[%idxprom9]
     57   %conv = zext i8 %tmp11 to i32  ; the expected output does the load and the extension in one movzbl
     58   ret i32 %conv
     59 
     60 ; CHECK-LABEL: test4:
     61 ; CHECK: movq	_rtx_length@GOTPCREL(%rip), %rax
     62 ; CHECK-NEXT: movzbl	(%rax,%rdi), %eax
     63 ; CHECK-NEXT: ret
     64 }
     65 
     66 
     67 ; PR3242 - Out of range shifts should not be folded by fastisel.
     68 define void @test5(i32 %x, i32* %p) nounwind {
     69   %y = ashr i32 %x, 50000  ; shift amount is far larger than the 32-bit operand width
     70   store i32 %y, i32* %p
     71   ret void
     72 
     73 ; The expected output keeps the amount in a register (%ecx) and shifts by %cl
     74 ; instead of encoding 50000 as a shift immediate.
     75 ; CHECK-LABEL: test5:
     76 ; CHECK: movl	$50000, %ecx
     77 ; CHECK: sarl	%cl, %edi
     78 ; CHECK: ret
     79 }
     78 
     79 ; rdar://9289501 - fast isel should fold trivial multiplies to shifts.
     80 define i64 @test6(i64 %x) nounwind ssp {
     81 entry:
     82   %mul = mul nsw i64 %x, 8  ; 8 == 1 << 3, so a left shift by 3 is expected
     83   ret i64 %mul
     84 
     85 ; CHECK-LABEL: test6:
     86 ; CHECK: shlq	$3, %rdi
     87 }
     88 
     89 define i32 @test7(i32 %x) nounwind ssp {  ; 32-bit variant of the multiply-by-8 case
     90 entry:
     91   %mul = mul nsw i32 %x, 8  ; 8 == 1 << 3, so a 32-bit left shift by 3 is expected
     92   ret i32 %mul
     93 ; CHECK-LABEL: test7:
     94 ; CHECK: shll	$3, %edi
     95 }
     96 
     97 
     98 ; rdar://9289507 - folding of immediates into 64-bit operations.
     99 define i64 @test8(i64 %x) nounwind ssp {
    100 entry:
    101   %add = add nsw i64 %x, 7  ; the constant 7 is expected as an immediate operand of addq
    102   ret i64 %add
    103 
    104 ; CHECK-LABEL: test8:
    105 ; CHECK: addq	$7, %rdi
    106 }
    107 
    108 define i64 @test9(i64 %x) nounwind ssp {  ; 64-bit multiply by a constant that is not a power of two
    109 entry:
    110   %add = mul nsw i64 %x, 7  ; note: despite its name, %add holds the product %x * 7
    111   ret i64 %add
    112 ; CHECK-LABEL: test9:
    113 ; CHECK: imulq	$7, %rdi, %rax
    114 }
    115 
    116 ; rdar://9297011 - Don't reject udiv by a power of 2.
    117 define i32 @test10(i32 %X) nounwind {
    118   %Y = udiv i32 %X, 8  ; 8 == 1 << 3: a logical right shift by 3 is expected
    119   ret i32 %Y
    120 ; CHECK-LABEL: test10:
    121 ; CHECK: shrl	$3, 
    122 }
    123 
    124 define i32 @test11(i32 %X) nounwind {  ; signed counterpart of the divide-by-8 case
    125   %Y = sdiv exact i32 %X, 8  ; 'exact' signed divide by 8: an arithmetic right shift by 3 is expected
    126   ret i32 %Y
    127 ; CHECK-LABEL: test11:
    128 ; CHECK: sarl	$3, 
    129 }
    130 
    131 
    132 ; rdar://9297006 - Trunc to bool, then branch on the resulting i1.
    133 define void @test12(i8 %tmp) nounwind ssp noredzone {
    134 entry:
    135   %tobool = trunc i8 %tmp to i1  ; only bit 0 of %tmp is kept; the expected output tests it with testb $1
    136   br i1 %tobool, label %if.then, label %if.end
    137 
    138 if.then:                                          ; preds = %entry
    139   call void @test12(i8 0) noredzone  ; self-call with constant 0; the argument is expected to be zeroed with xorl
    140   br label %if.end
    141 
    142 if.end:                                           ; preds = %if.then, %entry
    143   ret void
    144 ; CHECK-LABEL: test12:
    145 ; CHECK: testb	$1,
    146 ; CHECK-NEXT: je L
    147 ; CHECK-NEXT: xorl %edi, %edi
    148 ; CHECK-NEXT: callq
    149 }
    150 
    151 declare void @test13f(i1 %X)  ; external callee taking an i1; called by test13 and test14
    152 
    153 define void @test13() nounwind {  ; passes a constant i1 argument to a call
    154   call void @test13f(i1 0)  ; the false argument is expected to be materialized by zeroing %edi
    155   ret void
    156 ; CHECK-LABEL: test13:
    157 ; CHECK: xorl %edi, %edi
    158 ; CHECK-NEXT: callq
    159 }
    160 
    161 
    162 
    163 ; rdar://9297003 - fast isel bails out on all functions taking bools
    164 define void @test14(i8 %tmp) nounwind ssp noredzone {
    165 entry:
    166   %tobool = trunc i8 %tmp to i1  ; non-constant i1 produced by truncation
    167   call void @test13f(i1 zeroext %tobool) noredzone  ; zeroext i1 argument: the expected output masks it with andb $1 before the call
    168   ret void
    169 ; CHECK-LABEL: test14:
    170 ; CHECK: andb	$1, 
    171 ; CHECK: callq
    172 }
    173 
    174 declare void @llvm.memcpy.p0i8.p0i8.i64(i8*, i8*, i64, i32, i1)  ; five-operand form of the memcpy intrinsic used by test15
    175 
    176 ; rdar://9289488 - fast-isel shouldn't bail out on llvm.memcpy
    177 define void @test15(i8* %a, i8* %b) nounwind {
    178   call void @llvm.memcpy.p0i8.p0i8.i64(i8* %a, i8* %b, i64 4, i32 4, i1 false)  ; small constant-size copy: one 32-bit load from %b and one 32-bit store to %a are expected
    179   ret void
    180 ; CHECK-LABEL: test15:
    181 ; CHECK-NEXT: movl	(%rsi), %eax
    182 ; CHECK-NEXT: movl	%eax, (%rdi)
    183 ; CHECK-NEXT: ret
    184 }
    185 
    186 ; Handling for varargs calls: %al is expected to be 0 for the integer-only call and 1 for the call passing one double.
    187 declare void @test16callee(...) nounwind
    188 define void @test16() nounwind {
    189 ; CHECK-LABEL: test16:
    190 ; CHECK: movl $1, %edi
    191 ; CHECK: movb $0, %al
    192 ; CHECK: callq _test16callee
    193   call void (...) @test16callee(i32 1)  ; integer argument only, no floating-point arguments
    194   br label %block2
    195 
    196 block2:
    197 ; CHECK: movsd LCP{{.*}}_{{.*}}(%rip), %xmm0
    198 ; CHECK: movb $1, %al
    199 ; CHECK: callq _test16callee
    200 
    201 ; AVX: vmovsd LCP{{.*}}_{{.*}}(%rip), %xmm0
    202 ; AVX: movb $1, %al
    203 ; AVX: callq _test16callee
    204   call void (...) @test16callee(double 1.000000e+00)  ; one double argument, expected to be loaded from a constant pool into %xmm0
    205   ret void
    206 }
    207 
    208 
    209 declare void @foo() unnamed_addr ssp align 2  ; external function called between the load and the branch in test17
    210 
    211 ; Verify that we don't fold the load into the compare here.  That would move it
    212 ; w.r.t. the call.
    213 define i32 @test17(i32 *%P) ssp nounwind {
    214 entry:
    215   %tmp = load i32, i32* %P  ; load happens before the call to @foo and must stay there
    216   %cmp = icmp ne i32 %tmp, 5
    217   call void @foo()  ; sits between the load/compare and the branch that uses %cmp
    218   br i1 %cmp, label %if.then, label %if.else
    219 
    220 if.then:                                          ; preds = %entry
    221   ret i32 1
    222 
    223 if.else:                                          ; preds = %entry
    224   ret i32 2
    225 ; CHECK-LABEL: test17:
    226 ; CHECK: movl	(%rdi), %eax
    227 ; CHECK: callq _foo
    228 ; CHECK: cmpl	$5, %eax
    229 ; CHECK-NEXT: je 
    230 }
    231 
    232 ; Check that 0.0 is materialized using xorps
    233 define void @test18(float* %p1) {
    234   store float 0.0, float* %p1  ; single-precision +0.0 constant stored through %p1
    235   ret void
    236 ; CHECK-LABEL: test18:
    237 ; CHECK: xorps
    238 }
    239 
    240 ; Without any type hints, doubles use the smaller xorps instead of xorpd.
    241 define void @test19(double* %p1) {
    242   store double 0.0, double* %p1  ; double-precision +0.0 constant stored through %p1
    243   ret void
    244 ; CHECK-LABEL: test19:
    245 ; CHECK: xorps
    246 }
    247 
    248 ; Check that we fast-isel sret
    249 %struct.a = type { i64, i64, i64 }  ; three-i64 aggregate used as the sret object
    250 define void @test20() nounwind ssp {
    251 entry:
    252   %tmp = alloca %struct.a, align 8  ; stack storage handed to the callee
    253   call void @test20sret(%struct.a* sret %tmp)  ; the address of %tmp is expected to be formed with leaq into %rdi
    254   ret void
    255 ; CHECK-LABEL: test20:
    256 ; CHECK: leaq (%rsp), %rdi
    257 ; CHECK: callq _test20sret
    258 }
    259 declare void @test20sret(%struct.a* sret)  ; external callee taking an sret pointer
    260 
    261 ; Check that -0.0 is not materialized using xor
    262 define void @test21(double* %p1) {
    263   store double -0.0, double* %p1  ; negative zero: expected to be loaded from a constant pool (LCPI label) instead
    264   ret void
    265 ; CHECK-LABEL: test21:
    266 ; CHECK-NOT: xor
    267 ; CHECK: movsd	LCPI
    268 }
    269 
    270 ; Check that immediate arguments to a function
    271 ; do not cause massive spilling and are used
    272 ; as immediates just before the call.
    273 define void @test22() nounwind {
    274 entry:
    275   call void @foo22(i32 0)  ; zero argument: expected to be produced by zeroing %edi
    276   call void @foo22(i32 1)  ; non-zero constants: expected as a movl immediate into %edi right before each call
    277   call void @foo22(i32 2)
    278   call void @foo22(i32 3)
    279   ret void
    280 ; CHECK-LABEL: test22:
    281 ; CHECK: xorl	%edi, %edi
    282 ; CHECK: callq	_foo22
    283 ; CHECK: movl	$1, %edi
    284 ; CHECK: callq	_foo22
    285 ; CHECK: movl	$2, %edi
    286 ; CHECK: callq	_foo22
    287 ; CHECK: movl	$3, %edi
    288 ; CHECK: callq	_foo22
    289 }
    290 
    291 declare void @foo22(i32)  ; external callee taking one i32
    292 
    293 ; PR13563 - function with an sret parameter: after the call, the incoming %rdi is expected to be copied to %rax before returning.
    294 define void @test23(i8* noalias sret %result) {
    295   %a = alloca i8  ; not referenced by any other instruction in this function
    296   %b = call i8* @foo23()  ; result is unused; the call itself must still be emitted
    297   ret void
    298 ; CHECK-LABEL: test23:
    299 ; CHECK: call
    300 ; CHECK: movq  %rdi, %rax
    301 ; CHECK: ret
    302 }
    303 
    304 declare i8* @foo23()  ; external function returning an i8*
    305 
    306 declare void @takesi32ptr(i32* %arg)  ; external callee that receives the alloca's address
    307 
    308 ; CHECK-LABEL: allocamaterialize
    309 define void @allocamaterialize() {  ; passes the address of a stack slot directly as a call argument
    310   %a = alloca i32
    311 ; CHECK: leaq {{.*}}, %rdi
    312   call void @takesi32ptr(i32* %a)  ; the address of %a is expected to be computed with leaq into %rdi
    313   ret void
    314 }
    315