; RUN: llc -mcpu cortex-a53 < %s | FileCheck %s
;
; Codegen regression test for store ordering. @main zero-fills the last four
; i32 elements of %b1 with a 16-byte memset and then stores 1 into elements
; 0..8 of the same array, so several of those stores overlap the memset's
; range. The checks attached to @main only pin down the relative order of the
; resulting stack stores.
;
; NOTE(review): attribute groups #1 and #3 are referenced below, but no
; definition for them is visible in this file.
target datalayout = "e-m:e-i64:64-i128:128-n8:16:32:64-S128"
target triple = "aarch64--linux-gnu"

declare void @f(i8*, i8*)
declare void @f2(i8*, i8*)
declare void @_Z5setupv()
declare void @llvm.memset.p0i8.i64(i8* nocapture, i8, i64, i1) #3

define i32 @main() local_unnamed_addr #1 {
; Make sure the stores happen in the correct order (the exact instructions could change).
; CHECK-LABEL: main:
; CHECK: stp xzr, xzr, [sp, #72]
; CHECK: str w9, [sp, #80]
; CHECK: str q0, [sp, #48]
; CHECK: ldr w8, [sp, #48]
; CHECK: str q0, [sp, #64]

for.body.lr.ph.i.i.i.i.i.i63:
  ; Two 10-element i32 arrays; only %b1 is written by this function.
  %b1 = alloca [10 x i32], align 16
  %x0 = bitcast [10 x i32]* %b1 to i8*
  %b2 = alloca [10 x i32], align 16
  %x1 = bitcast [10 x i32]* %b2 to i8*
  tail call void @_Z5setupv()
  ; Zero 16 bytes starting at element 6 of %b1, i.e. elements 6..9.
  %x2 = getelementptr inbounds [10 x i32], [10 x i32]* %b1, i64 0, i64 6
  %x3 = bitcast i32* %x2 to i8*
  call void @llvm.memset.p0i8.i64(i8* align 8 %x3, i8 0, i64 16, i1 false)
  ; Elements 0..3 of %b1 <- 1.
  %arraydecay2 = getelementptr inbounds [10 x i32], [10 x i32]* %b1, i64 0, i64 0
  %x4 = bitcast [10 x i32]* %b1 to <4 x i32>*
  store <4 x i32> <i32 1, i32 1, i32 1, i32 1>, <4 x i32>* %x4, align 16
  ; Elements 4..7 of %b1 <- 1; elements 6 and 7 were zeroed by the memset above.
  %incdec.ptr.i7.i.i.i.i.i.i64.3 = getelementptr inbounds [10 x i32], [10 x i32]* %b1, i64 0, i64 4
  %x5 = bitcast i32* %incdec.ptr.i7.i.i.i.i.i.i64.3 to <4 x i32>*
  store <4 x i32> <i32 1, i32 1, i32 1, i32 1>, <4 x i32>* %x5, align 16
  ; Element 8 of %b1 <- 1; this element also lies inside the memset's range.
  %incdec.ptr.i7.i.i.i.i.i.i64.7 = getelementptr inbounds [10 x i32], [10 x i32]* %b1, i64 0, i64 8
  store i32 1, i32* %incdec.ptr.i7.i.i.i.i.i.i64.7, align 16
  ; Reload element 0 of %b1 and branch on whether it equals 1.
  %x6 = load i32, i32* %arraydecay2, align 16
  %cmp6 = icmp eq i32 %x6, 1
  br i1 %cmp6, label %for.inc, label %if.then

for.inc:
  ; Taken when element 0 == 1: hand both arrays to @f.
  call void @f(i8* %x0, i8* %x1)
  ret i32 0

if.then:
  ; Taken when element 0 != 1: hand both arrays to @f2.
  call void @f2(i8* %x0, i8* %x1)
  ret i32 0
}