; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=i686-unknown -mattr=+sse2,-sse4.1 | FileCheck %s --check-prefix=X32
; RUN: llc < %s -mtriple=x86_64-unknown -mattr=+sse2,-sse4.1 | FileCheck %s --check-prefix=X64

; Checks the x86 code emitted for `insertelement` with a constant lane index
; on four vector types. The file is compiled twice: once for i686-unknown
; (checked under the X32 prefix) and once for x86_64-unknown (checked under the
; X64 prefix). Both runs enable SSE2 and explicitly disable SSE4.1.
; NOTE(review): SSE4.1 is presumably disabled so that dedicated SSE4.1 insert
; instructions are not selected and the SSE/SSE2 fallback sequences are what
; gets tested -- confirm against the history of this test.
;
; The assertion lines are tool-generated; regenerate them with the script named
; on the first line rather than editing them by hand.

; t1: insert the scalar float %s into lane 3 of the <4 x float> %tmp.
; Expected lowering is a pair of shufps instructions. On i686 the scalar is
; first loaded from memory with movss; on x86-64 the result is assembled in
; xmm1 and then copied into xmm0 with movaps.
define <4 x float> @t1(float %s, <4 x float> %tmp) nounwind {
; X32-LABEL: t1:
; X32:       # BB#0:
; X32-NEXT:    movss {{.*#+}} xmm1 = mem[0],zero,zero,zero
; X32-NEXT:    shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0]
; X32-NEXT:    shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0]
; X32-NEXT:    retl
;
; X64-LABEL: t1:
; X64:       # BB#0:
; X64-NEXT:    shufps {{.*#+}} xmm0 = xmm0[0,0],xmm1[2,0]
; X64-NEXT:    shufps {{.*#+}} xmm1 = xmm1[0,1],xmm0[2,0]
; X64-NEXT:    movaps %xmm1, %xmm0
; X64-NEXT:    retq
  %tmp1 = insertelement <4 x float> %tmp, float %s, i32 3
  ret <4 x float> %tmp1
}

; t2: insert the scalar i32 %s into lane 3 of the <4 x i32> %tmp.
; Expected lowering moves the scalar into xmm1 with movd (from memory on i686,
; from %edi on x86-64) and then uses the same two-shufps sequence as t1.
define <4 x i32> @t2(i32 %s, <4 x i32> %tmp) nounwind {
; X32-LABEL: t2:
; X32:       # BB#0:
; X32-NEXT:    movd {{.*#+}} xmm1 = mem[0],zero,zero,zero
; X32-NEXT:    shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0]
; X32-NEXT:    shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0]
; X32-NEXT:    retl
;
; X64-LABEL: t2:
; X64:       # BB#0:
; X64-NEXT:    movd %edi, %xmm1
; X64-NEXT:    shufps {{.*#+}} xmm1 = xmm1[0,0],xmm0[2,0]
; X64-NEXT:    shufps {{.*#+}} xmm0 = xmm0[0,1],xmm1[2,0]
; X64-NEXT:    retq
  %tmp1 = insertelement <4 x i32> %tmp, i32 %s, i32 3
  ret <4 x i32> %tmp1
}

; t3: insert the scalar double %s into lane 1 of the <2 x double> %tmp.
; Expected lowering on i686 is a single movhpd that takes the new high element
; from memory; on x86-64 it is an unpcklpd into xmm1 followed by a movapd copy
; into xmm0.
define <2 x double> @t3(double %s, <2 x double> %tmp) nounwind {
; X32-LABEL: t3:
; X32:       # BB#0:
; X32-NEXT:    movhpd {{.*#+}} xmm0 = xmm0[0],mem[0]
; X32-NEXT:    retl
;
; X64-LABEL: t3:
; X64:       # BB#0:
; X64-NEXT:    unpcklpd {{.*#+}} xmm1 = xmm1[0],xmm0[0]
; X64-NEXT:    movapd %xmm1, %xmm0
; X64-NEXT:    retq
  %tmp1 = insertelement <2 x double> %tmp, double %s, i32 1
  ret <2 x double> %tmp1
}

; t4: insert the scalar i16 %s into lane 5 of the <8 x i16> %tmp.
; Expected lowering is a single pinsrw with immediate 5 on both targets; the
; source operand is an %esp-relative memory slot on i686 and %edi on x86-64.
define <8 x i16> @t4(i16 %s, <8 x i16> %tmp) nounwind {
; X32-LABEL: t4:
; X32:       # BB#0:
; X32-NEXT:    pinsrw $5, {{[0-9]+}}(%esp), %xmm0
; X32-NEXT:    retl
;
; X64-LABEL: t4:
; X64:       # BB#0:
; X64-NEXT:    pinsrw $5, %edi, %xmm0
; X64-NEXT:    retq
  %tmp1 = insertelement <8 x i16> %tmp, i16 %s, i32 5
  ret <8 x i16> %tmp1
}