1 ; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py 2 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=sse4.1 | FileCheck %s --check-prefix=SSE41 3 4 define double @test1_add(double %A, double %B) { 5 ; SSE41-LABEL: test1_add: 6 ; SSE41: # %bb.0: 7 ; SSE41-NEXT: paddd %xmm1, %xmm0 8 ; SSE41-NEXT: retq 9 %1 = bitcast double %A to <2 x i32> 10 %2 = bitcast double %B to <2 x i32> 11 %add = add <2 x i32> %1, %2 12 %3 = bitcast <2 x i32> %add to double 13 ret double %3 14 } 15 16 define double @test2_add(double %A, double %B) { 17 ; SSE41-LABEL: test2_add: 18 ; SSE41: # %bb.0: 19 ; SSE41-NEXT: paddw %xmm1, %xmm0 20 ; SSE41-NEXT: retq 21 %1 = bitcast double %A to <4 x i16> 22 %2 = bitcast double %B to <4 x i16> 23 %add = add <4 x i16> %1, %2 24 %3 = bitcast <4 x i16> %add to double 25 ret double %3 26 } 27 28 define double @test3_add(double %A, double %B) { 29 ; SSE41-LABEL: test3_add: 30 ; SSE41: # %bb.0: 31 ; SSE41-NEXT: paddb %xmm1, %xmm0 32 ; SSE41-NEXT: retq 33 %1 = bitcast double %A to <8 x i8> 34 %2 = bitcast double %B to <8 x i8> 35 %add = add <8 x i8> %1, %2 36 %3 = bitcast <8 x i8> %add to double 37 ret double %3 38 } 39 40 define double @test1_sub(double %A, double %B) { 41 ; SSE41-LABEL: test1_sub: 42 ; SSE41: # %bb.0: 43 ; SSE41-NEXT: psubd %xmm1, %xmm0 44 ; SSE41-NEXT: retq 45 %1 = bitcast double %A to <2 x i32> 46 %2 = bitcast double %B to <2 x i32> 47 %sub = sub <2 x i32> %1, %2 48 %3 = bitcast <2 x i32> %sub to double 49 ret double %3 50 } 51 52 define double @test2_sub(double %A, double %B) { 53 ; SSE41-LABEL: test2_sub: 54 ; SSE41: # %bb.0: 55 ; SSE41-NEXT: psubw %xmm1, %xmm0 56 ; SSE41-NEXT: retq 57 %1 = bitcast double %A to <4 x i16> 58 %2 = bitcast double %B to <4 x i16> 59 %sub = sub <4 x i16> %1, %2 60 %3 = bitcast <4 x i16> %sub to double 61 ret double %3 62 } 63 64 define double @test3_sub(double %A, double %B) { 65 ; SSE41-LABEL: test3_sub: 66 ; SSE41: # %bb.0: 67 ; SSE41-NEXT: psubb %xmm1, %xmm0 68 ; SSE41-NEXT: retq 69 %1 = bitcast double %A to <8 x i8> 70 %2 = bitcast double %B to <8 x i8> 71 %sub = sub <8 x i8> %1, %2 72 %3 = bitcast <8 x i8> %sub to double 73 ret double %3 74 } 75 76 define double @test1_mul(double %A, double %B) { 77 ; SSE41-LABEL: test1_mul: 78 ; SSE41: # %bb.0: 79 ; SSE41-NEXT: pmulld %xmm1, %xmm0 80 ; SSE41-NEXT: retq 81 %1 = bitcast double %A to <2 x i32> 82 %2 = bitcast double %B to <2 x i32> 83 %mul = mul <2 x i32> %1, %2 84 %3 = bitcast <2 x i32> %mul to double 85 ret double %3 86 } 87 88 define double @test2_mul(double %A, double %B) { 89 ; SSE41-LABEL: test2_mul: 90 ; SSE41: # %bb.0: 91 ; SSE41-NEXT: pmullw %xmm1, %xmm0 92 ; SSE41-NEXT: retq 93 %1 = bitcast double %A to <4 x i16> 94 %2 = bitcast double %B to <4 x i16> 95 %mul = mul <4 x i16> %1, %2 96 %3 = bitcast <4 x i16> %mul to double 97 ret double %3 98 } 99 100 ; There is no legal ISD::MUL with type MVT::v8i16. 101 define double @test3_mul(double %A, double %B) { 102 ; SSE41-LABEL: test3_mul: 103 ; SSE41: # %bb.0: 104 ; SSE41-NEXT: pmovzxbw {{.*#+}} xmm2 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero,xmm0[4],zero,xmm0[5],zero,xmm0[6],zero,xmm0[7],zero 105 ; SSE41-NEXT: pmovzxbw {{.*#+}} xmm0 = xmm1[0],zero,xmm1[1],zero,xmm1[2],zero,xmm1[3],zero,xmm1[4],zero,xmm1[5],zero,xmm1[6],zero,xmm1[7],zero 106 ; SSE41-NEXT: pmullw %xmm2, %xmm0 107 ; SSE41-NEXT: pshufb {{.*#+}} xmm0 = xmm0[0,2,4,6,8,10,12,14,u,u,u,u,u,u,u,u] 108 ; SSE41-NEXT: retq 109 %1 = bitcast double %A to <8 x i8> 110 %2 = bitcast double %B to <8 x i8> 111 %mul = mul <8 x i8> %1, %2 112 %3 = bitcast <8 x i8> %mul to double 113 ret double %3 114 } 115 116 define double @test1_and(double %A, double %B) { 117 ; SSE41-LABEL: test1_and: 118 ; SSE41: # %bb.0: 119 ; SSE41-NEXT: andps %xmm1, %xmm0 120 ; SSE41-NEXT: retq 121 %1 = bitcast double %A to <2 x i32> 122 %2 = bitcast double %B to <2 x i32> 123 %and = and <2 x i32> %1, %2 124 %3 = bitcast <2 x i32> %and to double 125 ret double %3 126 } 127 128 define double @test2_and(double %A, double %B) { 129 ; SSE41-LABEL: test2_and: 130 ; SSE41: # %bb.0: 131 ; SSE41-NEXT: andps %xmm1, %xmm0 132 ; SSE41-NEXT: retq 133 %1 = bitcast double %A to <4 x i16> 134 %2 = bitcast double %B to <4 x i16> 135 %and = and <4 x i16> %1, %2 136 %3 = bitcast <4 x i16> %and to double 137 ret double %3 138 } 139 140 define double @test3_and(double %A, double %B) { 141 ; SSE41-LABEL: test3_and: 142 ; SSE41: # %bb.0: 143 ; SSE41-NEXT: andps %xmm1, %xmm0 144 ; SSE41-NEXT: retq 145 %1 = bitcast double %A to <8 x i8> 146 %2 = bitcast double %B to <8 x i8> 147 %and = and <8 x i8> %1, %2 148 %3 = bitcast <8 x i8> %and to double 149 ret double %3 150 } 151 152 define double @test1_or(double %A, double %B) { 153 ; SSE41-LABEL: test1_or: 154 ; SSE41: # %bb.0: 155 ; SSE41-NEXT: orps %xmm1, %xmm0 156 ; SSE41-NEXT: retq 157 %1 = bitcast double %A to <2 x i32> 158 %2 = bitcast double %B to <2 x i32> 159 %or = or <2 x i32> %1, %2 160 %3 = bitcast <2 x i32> %or to double 161 ret double %3 162 } 163 164 define double @test2_or(double %A, double %B) { 165 ; SSE41-LABEL: test2_or: 166 ; SSE41: # %bb.0: 167 ; SSE41-NEXT: orps %xmm1, %xmm0 168 ; SSE41-NEXT: retq 169 %1 = bitcast double %A to <4 x i16> 170 %2 = bitcast double %B to <4 x i16> 171 %or = or <4 x i16> %1, %2 172 %3 = bitcast <4 x i16> %or to double 173 ret double %3 174 } 175 176 define double @test3_or(double %A, double %B) { 177 ; SSE41-LABEL: test3_or: 178 ; SSE41: # %bb.0: 179 ; SSE41-NEXT: orps %xmm1, %xmm0 180 ; SSE41-NEXT: retq 181 %1 = bitcast double %A to <8 x i8> 182 %2 = bitcast double %B to <8 x i8> 183 %or = or <8 x i8> %1, %2 184 %3 = bitcast <8 x i8> %or to double 185 ret double %3 186 } 187 188 define double @test1_xor(double %A, double %B) { 189 ; SSE41-LABEL: test1_xor: 190 ; SSE41: # %bb.0: 191 ; SSE41-NEXT: xorps %xmm1, %xmm0 192 ; SSE41-NEXT: retq 193 %1 = bitcast double %A to <2 x i32> 194 %2 = bitcast double %B to <2 x i32> 195 %xor = xor <2 x i32> %1, %2 196 %3 = bitcast <2 x i32> %xor to double 197 ret double %3 198 } 199 200 define double @test2_xor(double %A, double %B) { 201 ; SSE41-LABEL: test2_xor: 202 ; SSE41: # %bb.0: 203 ; SSE41-NEXT: xorps %xmm1, %xmm0 204 ; SSE41-NEXT: retq 205 %1 = bitcast double %A to <4 x i16> 206 %2 = bitcast double %B to <4 x i16> 207 %xor = xor <4 x i16> %1, %2 208 %3 = bitcast <4 x i16> %xor to double 209 ret double %3 210 } 211 212 define double @test3_xor(double %A, double %B) { 213 ; SSE41-LABEL: test3_xor: 214 ; SSE41: # %bb.0: 215 ; SSE41-NEXT: xorps %xmm1, %xmm0 216 ; SSE41-NEXT: retq 217 %1 = bitcast double %A to <8 x i8> 218 %2 = bitcast double %B to <8 x i8> 219 %xor = xor <8 x i8> %1, %2 220 %3 = bitcast <8 x i8> %xor to double 221 ret double %3 222 } 223 224 define double @test_fadd(double %A, double %B) { 225 ; SSE41-LABEL: test_fadd: 226 ; SSE41: # %bb.0: 227 ; SSE41-NEXT: addps %xmm1, %xmm0 228 ; SSE41-NEXT: retq 229 %1 = bitcast double %A to <2 x float> 230 %2 = bitcast double %B to <2 x float> 231 %add = fadd <2 x float> %1, %2 232 %3 = bitcast <2 x float> %add to double 233 ret double %3 234 } 235 236 define double @test_fsub(double %A, double %B) { 237 ; SSE41-LABEL: test_fsub: 238 ; SSE41: # %bb.0: 239 ; SSE41-NEXT: subps %xmm1, %xmm0 240 ; SSE41-NEXT: retq 241 %1 = bitcast double %A to <2 x float> 242 %2 = bitcast double %B to <2 x float> 243 %sub = fsub <2 x float> %1, %2 244 %3 = bitcast <2 x float> %sub to double 245 ret double %3 246 } 247 248 define double @test_fmul(double %A, double %B) { 249 ; SSE41-LABEL: test_fmul: 250 ; SSE41: # %bb.0: 251 ; SSE41-NEXT: mulps %xmm1, %xmm0 252 ; SSE41-NEXT: retq 253 %1 = bitcast double %A to <2 x float> 254 %2 = bitcast double %B to <2 x float> 255 %mul = fmul <2 x float> %1, %2 256 %3 = bitcast <2 x float> %mul to double 257 ret double %3 258 } 259 260