1 ; RUN: llc -mtriple armv7a-none-eabi -mattr=-neon < %s -verify-machineinstrs -o - | FileCheck %s 2 3 ; Thumb1 (thumbv6m) is tested in tests/Thumb 4 5 @a = external global i32* 6 @b = external global i32* 7 8 ; Function Attrs: nounwind 9 define void @foo24() #0 { 10 entry: 11 ; CHECK-LABEL: foo24: 12 ; We use '[rl0-9]*' to allow 'r0'..'r12', 'lr' 13 ; CHECK: movt [[LB:[rl0-9]+]], :upper16:b 14 ; CHECK: movt [[SB:[rl0-9]+]], :upper16:a 15 ; CHECK: add [[NLB:[rl0-9]+]], [[LB]], #4 16 ; CHECK: add [[NSB:[rl0-9]+]], [[SB]], #4 17 ; CHECK-NEXT: ldm [[NLB]], {[[R1:[rl0-9]+]], [[R2:[rl0-9]+]], [[R3:[rl0-9]+]], [[R4:[rl0-9]+]], [[R5:[rl0-9]+]], [[R6:[rl0-9]+]]} 18 ; CHECK-NEXT: stm [[NSB]], {[[R1]], [[R2]], [[R3]], [[R4]], [[R5]], [[R6]]} 19 %0 = load i32*, i32** @a, align 4 20 %arrayidx = getelementptr inbounds i32, i32* %0, i32 1 21 %1 = bitcast i32* %arrayidx to i8* 22 %2 = load i32*, i32** @b, align 4 23 %arrayidx1 = getelementptr inbounds i32, i32* %2, i32 1 24 %3 = bitcast i32* %arrayidx1 to i8* 25 tail call void @llvm.memcpy.p0i8.p0i8.i32(i8* %1, i8* %3, i32 24, i32 4, i1 false) 26 ret void 27 } 28 29 define void @foo28() #0 { 30 entry: 31 ; CHECK-LABEL: foo28: 32 ; CHECK: movt [[LB:[rl0-9]+]], :upper16:b 33 ; CHECK: movt [[SB:[rl0-9]+]], :upper16:a 34 ; CHECK: add [[NLB:[rl0-9]+]], [[LB]], #4 35 ; CHECK: add [[NSB:[rl0-9]+]], [[SB]], #4 36 ; CHECK-NEXT: ldm [[NLB]]!, {[[R1:[rl0-9]+]], [[R2:[rl0-9]+]], [[R3:[rl0-9]+]]} 37 ; CHECK-NEXT: stm [[NSB]]!, {[[R1]], [[R2]], [[R3]]} 38 ; CHECK-NEXT: ldm [[NLB]], {[[R1:[rl0-9]+]], [[R2:[rl0-9]+]], [[R3:[rl0-9]+]], [[R4:[rl0-9]+]]} 39 ; CHECK-NEXT: stm [[NSB]], {[[R1]], [[R2]], [[R3]], [[R4]]} 40 %0 = load i32*, i32** @a, align 4 41 %arrayidx = getelementptr inbounds i32, i32* %0, i32 1 42 %1 = bitcast i32* %arrayidx to i8* 43 %2 = load i32*, i32** @b, align 4 44 %arrayidx1 = getelementptr inbounds i32, i32* %2, i32 1 45 %3 = bitcast i32* %arrayidx1 to i8* 46 tail call void @llvm.memcpy.p0i8.p0i8.i32(i8* %1, i8* %3, i32 28, i32 4, i1 false) 47 ret void 48 } 49 50 define void @foo32() #0 { 51 entry: 52 ; CHECK-LABEL: foo32: 53 ; CHECK: movt [[LB:[rl0-9]+]], :upper16:b 54 ; CHECK: movt [[SB:[rl0-9]+]], :upper16:a 55 ; CHECK: add [[NLB:[rl0-9]+]], [[LB]], #4 56 ; CHECK: add [[NSB:[rl0-9]+]], [[SB]], #4 57 ; CHECK-NEXT: ldm [[NLB]]!, {[[R1:[rl0-9]+]], [[R2:[rl0-9]+]], [[R3:[rl0-9]+]], [[R4:[rl0-9]+]]} 58 ; CHECK-NEXT: stm [[NSB]]!, {[[R1]], [[R2]], [[R3]], [[R4]]} 59 ; CHECK-NEXT: ldm [[NLB]], {[[R1:[rl0-9]+]], [[R2:[rl0-9]+]], [[R3:[rl0-9]+]], [[R4:[rl0-9]+]]} 60 ; CHECK-NEXT: stm [[NSB]], {[[R1]], [[R2]], [[R3]], [[R4]]} 61 %0 = load i32*, i32** @a, align 4 62 %arrayidx = getelementptr inbounds i32, i32* %0, i32 1 63 %1 = bitcast i32* %arrayidx to i8* 64 %2 = load i32*, i32** @b, align 4 65 %arrayidx1 = getelementptr inbounds i32, i32* %2, i32 1 66 %3 = bitcast i32* %arrayidx1 to i8* 67 tail call void @llvm.memcpy.p0i8.p0i8.i32(i8* %1, i8* %3, i32 32, i32 4, i1 false) 68 ret void 69 } 70 71 define void @foo36() #0 { 72 entry: 73 ; CHECK-LABEL: foo36: 74 ; CHECK: movt [[LB:[rl0-9]+]], :upper16:b 75 ; CHECK: movt [[SB:[rl0-9]+]], :upper16:a 76 ; CHECK: add [[NLB:[rl0-9]+]], [[LB]], #4 77 ; CHECK: add [[NSB:[rl0-9]+]], [[SB]], #4 78 ; CHECK-NEXT: ldm [[NLB]]!, {[[R1:[rl0-9]+]], [[R2:[rl0-9]+]], [[R3:[rl0-9]+]], [[R4:[rl0-9]+]]} 79 ; CHECK-NEXT: stm [[NSB]]!, {[[R1]], [[R2]], [[R3]], [[R4]]} 80 ; CHECK-NEXT: ldm [[NLB]], {[[R1:[rl0-9]+]], [[R2:[rl0-9]+]], [[R3:[rl0-9]+]], [[R4:[rl0-9]+]], [[R5:[rl0-9]+]]} 81 ; CHECK-NEXT: stm [[NSB]], {[[R1]], [[R2]], [[R3]], [[R4]], [[R5]]} 82 %0 = load i32*, i32** @a, align 4 83 %arrayidx = getelementptr inbounds i32, i32* %0, i32 1 84 %1 = bitcast i32* %arrayidx to i8* 85 %2 = load i32*, i32** @b, align 4 86 %arrayidx1 = getelementptr inbounds i32, i32* %2, i32 1 87 %3 = bitcast i32* %arrayidx1 to i8* 88 tail call void @llvm.memcpy.p0i8.p0i8.i32(i8* %1, i8* %3, i32 36, i32 4, i1 false) 89 ret void 90 } 91 92 ; Function Attrs: nounwind 93 declare void @llvm.memcpy.p0i8.p0i8.i32(i8* nocapture, i8* nocapture readonly, i32, i32, i1) #1 94