;; @regpressure1 and @regpressure2 in this testcase should codegen to the same
;; function, and neither of them should require spilling anything to the stack.
;; NOTE(review): the file also defines @regpressure3; the spill check in the
;; RUN lines below greps the statistics for the whole file, so it appears to
;; cover that function as well -- confirm.

; RUN: llc < %s -march=x86 -stats |& \
; RUN:   not grep {Number of register spills}

;; This can be compiled to use three registers if the loads are not
;; folded into the multiplies, 2 registers otherwise.

;; @regpressure1: multiplies together the ten i32 values at %P[0] .. %P[9].
;; Each element is loaded immediately before the multiply that consumes it,
;; so only the running product and one freshly loaded value are needed at any
;; point in the instruction stream as written.
define i32 @regpressure1(i32* %P) {
        %A = load i32* %P               ; <i32> [#uses=1]
        %Bp = getelementptr i32* %P, i32 1              ; <i32*> [#uses=1]
        %B = load i32* %Bp              ; <i32> [#uses=1]
        %s1 = mul i32 %A, %B            ; <i32> [#uses=1]
        %Cp = getelementptr i32* %P, i32 2              ; <i32*> [#uses=1]
        %C = load i32* %Cp              ; <i32> [#uses=1]
        %s2 = mul i32 %s1, %C           ; <i32> [#uses=1]
        %Dp = getelementptr i32* %P, i32 3              ; <i32*> [#uses=1]
        %D = load i32* %Dp              ; <i32> [#uses=1]
        %s3 = mul i32 %s2, %D           ; <i32> [#uses=1]
        %Ep = getelementptr i32* %P, i32 4              ; <i32*> [#uses=1]
        %E = load i32* %Ep              ; <i32> [#uses=1]
        %s4 = mul i32 %s3, %E           ; <i32> [#uses=1]
        %Fp = getelementptr i32* %P, i32 5              ; <i32*> [#uses=1]
        %F = load i32* %Fp              ; <i32> [#uses=1]
        %s5 = mul i32 %s4, %F           ; <i32> [#uses=1]
        %Gp = getelementptr i32* %P, i32 6              ; <i32*> [#uses=1]
        %G = load i32* %Gp              ; <i32> [#uses=1]
        %s6 = mul i32 %s5, %G           ; <i32> [#uses=1]
        %Hp = getelementptr i32* %P, i32 7              ; <i32*> [#uses=1]
        %H = load i32* %Hp              ; <i32> [#uses=1]
        %s7 = mul i32 %s6, %H           ; <i32> [#uses=1]
        %Ip = getelementptr i32* %P, i32 8              ; <i32*> [#uses=1]
        %I = load i32* %Ip              ; <i32> [#uses=1]
        %s8 = mul i32 %s7, %I           ; <i32> [#uses=1]
        %Jp = getelementptr i32* %P, i32 9              ; <i32*> [#uses=1]
        %J = load i32* %Jp              ; <i32> [#uses=1]
        %s9 = mul i32 %s8, %J           ; <i32> [#uses=1]
        ret i32 %s9
}

;; @regpressure2: computes the same product as @regpressure1, but the IR
;; performs all ten loads up front and only then runs the chain of nine
;; multiplies. As written, all ten loaded values are live before the first
;; multiply; the test expects the code generator to still avoid spilling.
define i32 @regpressure2(i32* %P) {
        %A = load i32* %P               ; <i32> [#uses=1]
        %Bp = getelementptr i32* %P, i32 1              ; <i32*> [#uses=1]
        %B = load i32* %Bp              ; <i32> [#uses=1]
        %Cp = getelementptr i32* %P, i32 2              ; <i32*> [#uses=1]
        %C = load i32* %Cp              ; <i32> [#uses=1]
        %Dp = getelementptr i32* %P, i32 3              ; <i32*> [#uses=1]
        %D = load i32* %Dp              ; <i32> [#uses=1]
        %Ep = getelementptr i32* %P, i32 4              ; <i32*> [#uses=1]
        %E = load i32* %Ep              ; <i32> [#uses=1]
        %Fp = getelementptr i32* %P, i32 5              ; <i32*> [#uses=1]
        %F = load i32* %Fp              ; <i32> [#uses=1]
        %Gp = getelementptr i32* %P, i32 6              ; <i32*> [#uses=1]
        %G = load i32* %Gp              ; <i32> [#uses=1]
        %Hp = getelementptr i32* %P, i32 7              ; <i32*> [#uses=1]
        %H = load i32* %Hp              ; <i32> [#uses=1]
        %Ip = getelementptr i32* %P, i32 8              ; <i32*> [#uses=1]
        %I = load i32* %Ip              ; <i32> [#uses=1]
        %Jp = getelementptr i32* %P, i32 9              ; <i32*> [#uses=1]
        %J = load i32* %Jp              ; <i32> [#uses=1]
        %s1 = mul i32 %A, %B            ; <i32> [#uses=1]
        %s2 = mul i32 %s1, %C           ; <i32> [#uses=1]
        %s3 = mul i32 %s2, %D           ; <i32> [#uses=1]
        %s4 = mul i32 %s3, %E           ; <i32> [#uses=1]
        %s5 = mul i32 %s4, %F           ; <i32> [#uses=1]
        %s6 = mul i32 %s5, %G           ; <i32> [#uses=1]
        %s7 = mul i32 %s6, %H           ; <i32> [#uses=1]
        %s8 = mul i32 %s7, %I           ; <i32> [#uses=1]
        %s9 = mul i32 %s8, %J           ; <i32> [#uses=1]
        ret i32 %s9
}

;; @regpressure3: loads the ten i16 values at %P[0] .. %P[9] up front,
;; sign-extends each one to i32, and returns their sum.
;; The %Cond and %Other parameters are not referenced anywhere in the body.
define i32 @regpressure3(i16* %P, i1 %Cond, i32* %Other) {
        %A = load i16* %P               ; <i16> [#uses=1]
        %Bp = getelementptr i16* %P, i32 1              ; <i16*> [#uses=1]
        %B = load i16* %Bp              ; <i16> [#uses=1]
        %Cp = getelementptr i16* %P, i32 2              ; <i16*> [#uses=1]
        %C = load i16* %Cp              ; <i16> [#uses=1]
        %Dp = getelementptr i16* %P, i32 3              ; <i16*> [#uses=1]
        %D = load i16* %Dp              ; <i16> [#uses=1]
        %Ep = getelementptr i16* %P, i32 4              ; <i16*> [#uses=1]
        %E = load i16* %Ep              ; <i16> [#uses=1]
        %Fp = getelementptr i16* %P, i32 5              ; <i16*> [#uses=1]
        %F = load i16* %Fp              ; <i16> [#uses=1]
        %Gp = getelementptr i16* %P, i32 6              ; <i16*> [#uses=1]
        %G = load i16* %Gp              ; <i16> [#uses=1]
        %Hp = getelementptr i16* %P, i32 7              ; <i16*> [#uses=1]
        %H = load i16* %Hp              ; <i16> [#uses=1]
        %Ip = getelementptr i16* %P, i32 8              ; <i16*> [#uses=1]
        %I = load i16* %Ip              ; <i16> [#uses=1]
        %Jp = getelementptr i16* %P, i32 9              ; <i16*> [#uses=1]
        %J = load i16* %Jp              ; <i16> [#uses=1]
        ; Widen every loaded element to i32 before accumulating.
        ; Note the D extension is emitted before the C extension here.
        %A.upgrd.1 = sext i16 %A to i32         ; <i32> [#uses=1]
        %B.upgrd.2 = sext i16 %B to i32         ; <i32> [#uses=1]
        %D.upgrd.3 = sext i16 %D to i32         ; <i32> [#uses=1]
        %C.upgrd.4 = sext i16 %C to i32         ; <i32> [#uses=1]
        %E.upgrd.5 = sext i16 %E to i32         ; <i32> [#uses=1]
        %F.upgrd.6 = sext i16 %F to i32         ; <i32> [#uses=1]
        %G.upgrd.7 = sext i16 %G to i32         ; <i32> [#uses=1]
        %H.upgrd.8 = sext i16 %H to i32         ; <i32> [#uses=1]
        %I.upgrd.9 = sext i16 %I to i32         ; <i32> [#uses=1]
        %J.upgrd.10 = sext i16 %J to i32                ; <i32> [#uses=1]
        ; Linear accumulation chain: each add folds one more element into the
        ; running sum, in element order A, B, C, D, ..., J.
        %s1 = add i32 %A.upgrd.1, %B.upgrd.2            ; <i32> [#uses=1]
        %s2 = add i32 %C.upgrd.4, %s1           ; <i32> [#uses=1]
        %s3 = add i32 %D.upgrd.3, %s2           ; <i32> [#uses=1]
        %s4 = add i32 %E.upgrd.5, %s3           ; <i32> [#uses=1]
        %s5 = add i32 %F.upgrd.6, %s4           ; <i32> [#uses=1]
        %s6 = add i32 %G.upgrd.7, %s5           ; <i32> [#uses=1]
        %s7 = add i32 %H.upgrd.8, %s6           ; <i32> [#uses=1]
        %s8 = add i32 %I.upgrd.9, %s7           ; <i32> [#uses=1]
        %s9 = add i32 %J.upgrd.10, %s8          ; <i32> [#uses=1]
        ret i32 %s9
}