Home | History | Annotate | Download | only in X86

Lines Matching full:arg1

69   %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
70 %res = add <32 x i8> %arg0, %arg1
86 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
87 %res = add <16 x i16> %arg0, %arg1
103 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
104 %res = add <8 x i32> %arg0, %arg1
134 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
135 %res = call <32 x i8> @llvm.x86.avx2.padds.b(<32 x i8> %arg0, <32 x i8> %arg1)
152 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
153 %res = call <16 x i16> @llvm.x86.avx2.padds.w(<16 x i16> %arg0, <16 x i16> %arg1)
170 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
171 %res = call <32 x i8> @llvm.x86.avx2.paddus.b(<32 x i8> %arg0, <32 x i8> %arg1)
188 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
189 %res = call <16 x i16> @llvm.x86.avx2.paddus.w(<16 x i16> %arg0, <16 x i16> %arg1)
206 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
207 %shuf = shufflevector <32 x i8> %arg0, <32 x i8> %arg1, <32 x i32> <i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15, i32 32, i32 33, i32 18, i32 19, i32 20, i32 21, i32 22, i32 23, i32 24, i32 25, i32 26, i32 27, i32 28, i32 29, i32 30, i32 31, i32 48, i32 49>
223 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
224 %shuf = shufflevector <32 x i8> %arg0, <32 x i8> %arg1, <32 x i32> <i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15, i32 32, i32 17, i32 18, i32 19, i32 20, i32 21, i32 22, i32 23, i32 24, i32 25, i32 26, i32 27, i32 28, i32 29, i32 30, i32 31, i32 48>
273 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
274 %res = call <32 x i8> @llvm.x86.avx2.pavg.b(<32 x i8> %arg0, <32 x i8> %arg1)
291 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
292 %res = call <16 x i16> @llvm.x86.avx2.pavg.w(<16 x i16> %arg0, <16 x i16> %arg1)
309 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
310 %shuf = shufflevector <16 x i16> %arg0, <16 x i16> %arg1, <16 x i32> <i32 0, i32 17, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 25, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
326 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
327 %shuf = shufflevector <4 x i32> %arg0, <4 x i32> %arg1, <4 x i32> <i32 4, i32 1, i32 6, i32 3>
343 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
344 %shuf = shufflevector <8 x i32> %arg0, <8 x i32> %arg1, <8 x i32> <i32 8, i32 1, i32 10, i32 3, i32 12, i32 13, i32 6, i32 7>
360 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
362 %call = call <32 x i8> @llvm.x86.avx2.pblendvb(<32 x i8> %arg0, <32 x i8> %arg1, <32 x i8> %arg2)
605 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
606 %cmp = icmp eq <32 x i8> %arg0, %arg1
623 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
624 %cmp = icmp eq <16 x i16> %arg0, %arg1
641 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
642 %cmp = icmp eq <8 x i32> %arg0, %arg1
674 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
675 %cmp = icmp sgt <32 x i8> %arg0, %arg1
692 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
693 %cmp = icmp sgt <16 x i16> %arg0, %arg1
710 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
711 %cmp = icmp sgt <8 x i32> %arg0, %arg1
951 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
952 %res = call <16 x i16> @llvm.x86.avx2.phadd.w(<16 x i16> %arg0, <16 x i16> %arg1)
969 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
970 %res = call <8 x i32> @llvm.x86.avx2.phadd.d(<8 x i32> %arg0, <8 x i32> %arg1)
987 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
988 %res = call <16 x i16> @llvm.x86.avx2.phadd.sw(<16 x i16> %arg0, <16 x i16> %arg1)
1005 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
1006 %res = call <16 x i16> @llvm.x86.avx2.phsub.w(<16 x i16> %arg0, <16 x i16> %arg1)
1023 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
1024 %res = call <8 x i32> @llvm.x86.avx2.phsub.d(<8 x i32> %arg0, <8 x i32> %arg1)
1041 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
1042 %res = call <16 x i16> @llvm.x86.avx2.phsub.sw(<16 x i16> %arg0, <16 x i16> %arg1)
1064 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
1066 %call = call <4 x i32> @llvm.x86.avx2.gather.d.d(<4 x i32> undef, i8* %arg0, <4 x i32> %arg1, <4 x i32> %mask, i8 2)
1084 %arg1 = bitcast i32 *%a1 to i8*
1087 %call = call <4 x i32> @llvm.x86.avx2.gather.d.d(<4 x i32> %arg0, i8* %arg1, <4 x i32> %arg2, <4 x i32> %arg3, i8 2)
1108 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
1110 %call = call <8 x i32> @llvm.x86.avx2.gather.d.d.256(<8 x i32> undef, i8* %arg0, <8 x i32> %arg1, <8 x i32> %mask, i8 2)
1128 %arg1 = bitcast i32 *%a1 to i8*
1131 %call = call <8 x i32> @llvm.x86.avx2.gather.d.d.256(<8 x i32> %arg0, i8* %arg1, <8 x i32> %arg2, <8 x i32> %arg3, i8 2)
1152 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
1153 %res = call <2 x i64> @llvm.x86.avx2.gather.d.q(<2 x i64> undef, i8* %arg0, <4 x i32> %arg1, <2 x i64> <i64 -1, i64 -1>, i8 2)
1169 %arg1 = bitcast i64 *%a1 to i8*
1171 %res = call <2 x i64> @llvm.x86.avx2.gather.d.q(<2 x i64> %a0, i8* %arg1, <4 x i32> %arg2, <2 x i64> %a3, i8 2)
1191 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
1192 %res = call <4 x i64> @llvm.x86.avx2.gather.d.q.256(<4 x i64> undef, i8* %arg0, <4 x i32> %arg1, <4 x i64> <i64 -1, i64 -1, i64 -1, i64 -1>, i8 2)
1208 %arg1 = bitcast i64 *%a1 to i8*
1210 %res = call <4 x i64> @llvm.x86.avx2.gather.d.q.256(<4 x i64> %a0, i8* %arg1, <4 x i32> %arg2, <4 x i64> %a3, i8 2)
1230 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
1234 %res = call <2 x double> @llvm.x86.avx2.gather.d.pd(<2 x double> undef, i8* %arg0, <4 x i32> %arg1, <2 x double> %mask, i8 2)
1250 %arg1 = bitcast double *%a1 to i8*
1252 %res = call <2 x double> @llvm.x86.avx2.gather.d.pd(<2 x double> %a0, i8* %arg1, <4 x i32> %arg2, <2 x double> %a3, i8 2)
1274 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
1276 %res = call <4 x double> @llvm.x86.avx2.gather.d.pd.256(<4 x double> undef, i8* %arg0, <4 x i32> %arg1, <4 x double> %mask, i8 2)
1292 %arg1 = bitcast double *%a1 to i8*
1294 %res = call <4 x double> @llvm.x86.avx2.gather.d.pd.256(<4 x double> %a0, i8* %arg1, <4 x i32> %arg2, <4 x double> %a3, i8 2)
1314 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
1318 %call = call <4 x float> @llvm.x86.avx2.gather.d.ps(<4 x float> undef, i8* %arg0, <4 x i32> %arg1, <4 x float> %mask, i8 2)
1334 %arg1 = bitcast float *%a1 to i8*
1336 %call = call <4 x float> @llvm.x86.avx2.gather.d.ps(<4 x float> %a0, i8* %arg1, <4 x i32> %arg2, <4 x float> %a3, i8 2)
1358 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
1360 %call = call <8 x float> @llvm.x86.avx2.gather.d.ps.256(<8 x float> undef, i8* %arg0, <8 x i32> %arg1, <8 x float> %mask, i8 2)
1376 %arg1 = bitcast float *%a1 to i8*
1378 %call = call <8 x float> @llvm.x86.avx2.gather.d.ps.256(<8 x float> %a0, i8* %arg1, <8 x i32> %arg2, <8 x float> %a3, i8 2)
1417 %arg1 = bitcast i32 *%a1 to i8*
1419 %call = call <4 x i32> @llvm.x86.avx2.gather.q.d(<4 x i32> %arg0, i8* %arg1, <2 x i64> %a2, <4 x i32> %arg3, i8 2)
1463 %arg1 = bitcast i32 *%a1 to i8*
1465 %call = call <4 x i32> @llvm.x86.avx2.gather.q.d.256(<4 x i32> %arg0, i8* %arg1, <4 x i64> %a2, <4 x i32> %arg3, i8 2)
1502 %arg1 = bitcast i64 *%a1 to i8*
1503 %call = call <2 x i64> @llvm.x86.avx2.gather.q.q(<2 x i64> %a0, i8* %arg1, <2 x i64> %a2, <2 x i64> %a3, i8 2)
1539 %arg1 = bitcast i64 *%a1 to i8*
1540 %call = call <4 x i64> @llvm.x86.avx2.gather.q.q.256(<4 x i64> %a0, i8* %arg1, <4 x i64> %a2, <4 x i64> %a3, i8 2)
1579 %arg1 = bitcast double *%a1 to i8*
1580 %call = call <2 x double> @llvm.x86.avx2.gather.q.pd(<2 x double> %a0, i8* %arg1, <2 x i64> %a2, <2 x double> %a3, i8 2)
1619 %arg1 = bitcast i64 *%a1 to i8*
1620 %call = call <4 x double> @llvm.x86.avx2.gather.q.pd.256(<4 x double> %a0, i8* %arg1, <4 x i64> %a2, <4 x double> %a3, i8 2)
1659 %arg1 = bitcast float *%a1 to i8*
1660 %call = call <4 x float> @llvm.x86.avx2.gather.q.ps(<4 x float> %a0, i8* %arg1, <2 x i64> %a2, <4 x float> %a3, i8 2)
1703 %arg1 = bitcast float *%a1 to i8*
1704 %call = call <4 x float> @llvm.x86.avx2.gather.q.ps.256(<4 x float> %a0, i8* %arg1, <4 x i64> %a2, <4 x float> %a3, i8 2)
1751 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
1752 %res = call <8 x i32> @llvm.x86.avx2.pmadd.wd(<16 x i16> %arg0, <16 x i16> %arg1)
1769 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
1770 %res = call <16 x i16> @llvm.x86.avx2.pmadd.ub.sw(<32 x i8> %arg0, <32 x i8> %arg1)
1788 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
1789 %call = call <4 x i32> @llvm.x86.avx2.maskload.d(i8* %arg0, <4 x i32> %arg1)
1807 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
1808 %call = call <8 x i32> @llvm.x86.avx2.maskload.d.256(i8* %arg0, <8 x i32> %arg1)
1860 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
1862 call void @llvm.x86.avx2.maskstore.d(i8* %arg0, <4 x i32> %arg1, <4 x i32> %arg2)
1881 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
1883 call void @llvm.x86.avx2.maskstore.d.256(i8* %arg0, <8 x i32> %arg1, <8 x i32> %arg2)
1935 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
1936 %cmp = icmp sgt <32 x i8> %arg0, %arg1
1937 %sel = select <32 x i1> %cmp, <32 x i8> %arg0, <32 x i8> %arg1
1953 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
1954 %cmp = icmp sgt <16 x i16> %arg0, %arg1
1955 %sel = select <16 x i1> %cmp, <16 x i16> %arg0, <16 x i16> %arg1
1971 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
1972 %cmp = icmp sgt <8 x i32> %arg0, %arg1
1973 %sel = select <8 x i1> %cmp, <8 x i32> %arg0, <8 x i32> %arg1
1989 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
1990 %cmp = icmp ugt <32 x i8> %arg0, %arg1
1991 %sel = select <32 x i1> %cmp, <32 x i8> %arg0, <32 x i8> %arg1
2007 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
2008 %cmp = icmp ugt <16 x i16> %arg0, %arg1
2009 %sel = select <16 x i1> %cmp, <16 x i16> %arg0, <16 x i16> %arg1
2025 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2026 %cmp = icmp ugt <8 x i32> %arg0, %arg1
2027 %sel = select <8 x i1> %cmp, <8 x i32> %arg0, <8 x i32> %arg1
2043 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
2044 %cmp = icmp slt <32 x i8> %arg0, %arg1
2045 %sel = select <32 x i1> %cmp, <32 x i8> %arg0, <32 x i8> %arg1
2061 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
2062 %cmp = icmp slt <16 x i16> %arg0, %arg1
2063 %sel = select <16 x i1> %cmp, <16 x i16> %arg0, <16 x i16> %arg1
2079 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2080 %cmp = icmp slt <8 x i32> %arg0, %arg1
2081 %sel = select <8 x i1> %cmp, <8 x i32> %arg0, <8 x i32> %arg1
2097 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
2098 %cmp = icmp ult <32 x i8> %arg0, %arg1
2099 %sel = select <32 x i1> %cmp, <32 x i8> %arg0, <32 x i8> %arg1
2115 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
2116 %cmp = icmp ult <16 x i16> %arg0, %arg1
2117 %sel = select <16 x i1> %cmp, <16 x i16> %arg0, <16 x i16> %arg1
2133 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2134 %cmp = icmp ult <8 x i32> %arg0, %arg1
2135 %sel = select <8 x i1> %cmp, <8 x i32> %arg0, <8 x i32> %arg1
2169 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
2170 %call = call <16 x i16> @llvm.x86.avx2.mpsadbw(<32 x i8> %arg0, <32 x i8> %arg1, i8 3)
2187 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2188 %res = call <4 x i64> @llvm.x86.avx2.pmul.dq(<8 x i32> %arg0, <8 x i32> %arg1)
2204 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2205 %res = call <4 x i64> @llvm.x86.avx2.pmulu.dq(<8 x i32> %arg0, <8 x i32> %arg1)
2221 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
2222 %res = call <16 x i16> @llvm.x86.avx2.pmulh.w(<16 x i16> %arg0, <16 x i16> %arg1)
2239 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
2240 %res = call <16 x i16> @llvm.x86.avx2.pmulhu.w(<16 x i16> %arg0, <16 x i16> %arg1)
2257 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
2258 %res = call <16 x i16> @llvm.x86.avx2.pmul.hr.sw(<16 x i16> %arg0, <16 x i16> %arg1)
2275 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
2276 %res = mul <16 x i16> %arg0, %arg1
2292 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2293 %res = mul <8 x i32> %arg0, %arg1
2323 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
2324 %call = call <32 x i8> @llvm.x86.avx2.packsswb(<16 x i16> %arg0, <16 x i16> %arg1)
2341 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2342 %call = call <16 x i16> @llvm.x86.avx2.packssdw(<8 x i32> %arg0, <8 x i32> %arg1)
2359 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
2360 %call = call <32 x i8> @llvm.x86.avx2.packuswb(<16 x i16> %arg0, <16 x i16> %arg1)
2377 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2378 %call = call <16 x i16> @llvm.x86.avx2.packusdw(<8 x i32> %arg0, <8 x i32> %arg1)
2438 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2439 %call = call <8 x i32> @llvm.x86.avx2.permd(<8 x i32> %arg0, <8 x i32> %arg1)
2455 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2456 %res = call <8 x float> @llvm.x86.avx2.permps(<8 x float> %a0, <8 x i32> %arg1)
2472 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
2473 %res = call <4 x i64> @llvm.x86.avx2.psad.bw(<32 x i8> %arg0, <32 x i8> %arg1)
2505 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
2506 %shuf = call <32 x i8> @llvm.x86.avx2.pshuf.b(<32 x i8> %arg0, <32 x i8> %arg1)
2555 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
2556 %call = call <32 x i8> @llvm.x86.avx2.psign.b(<32 x i8> %arg0, <32 x i8> %arg1)
2573 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
2574 %call = call <16 x i16> @llvm.x86.avx2.psign.w(<16 x i16> %arg0, <16 x i16> %arg1)
2591 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2592 %call = call <8 x i32> @llvm.x86.avx2.psign.d(<8 x i32> %arg0, <8 x i32> %arg1)
2609 %arg1 = bitcast <2 x i64> %a1 to <8 x i16>
2610 %res = call <16 x i16> @llvm.x86.avx2.psll.w(<16 x i16> %arg0, <8 x i16> %arg1)
2627 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
2628 %res = call <8 x i32> @llvm.x86.avx2.psll.d(<8 x i32> %arg0, <4 x i32> %arg1)
2725 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
2726 %res = call <4 x i32> @llvm.x86.avx2.psllv.d(<4 x i32> %arg0, <4 x i32> %arg1)
2743 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2744 %res = call <8 x i32> @llvm.x86.avx2.psllv.d.256(<8 x i32> %arg0, <8 x i32> %arg1)
2791 %arg1 = bitcast <2 x i64> %a1 to <8 x i16>
2792 %res = call <16 x i16> @llvm.x86.avx2.psra.w(<16 x i16> %arg0, <8 x i16> %arg1)
2809 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
2810 %res = call <8 x i32> @llvm.x86.avx2.psra.d(<8 x i32> %arg0, <4 x i32> %arg1)
2861 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
2862 %res = call <4 x i32> @llvm.x86.avx2.psrav.d(<4 x i32> %arg0, <4 x i32> %arg1)
2879 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
2880 %res = call <8 x i32> @llvm.x86.avx2.psrav.d.256(<8 x i32> %arg0, <8 x i32> %arg1)
2897 %arg1 = bitcast <2 x i64> %a1 to <8 x i16>
2898 %res = call <16 x i16> @llvm.x86.avx2.psrl.w(<16 x i16> %arg0, <8 x i16> %arg1)
2915 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
2916 %res = call <8 x i32> @llvm.x86.avx2.psrl.d(<8 x i32> %arg0, <4 x i32> %arg1)
3013 %arg1 = bitcast <2 x i64> %a1 to <4 x i32>
3014 %res = call <4 x i32> @llvm.x86.avx2.psrlv.d(<4 x i32> %arg0, <4 x i32> %arg1)
3031 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
3032 %res = call <8 x i32> @llvm.x86.avx2.psrlv.d.256(<8 x i32> %arg0, <8 x i32> %arg1)
3096 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
3097 %res = sub <32 x i8> %arg0, %arg1
3113 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
3114 %res = sub <16 x i16> %arg0, %arg1
3130 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
3131 %res = sub <8 x i32> %arg0, %arg1
3161 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
3162 %res = call <32 x i8> @llvm.x86.avx2.psubs.b(<32 x i8> %arg0, <32 x i8> %arg1)
3179 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
3180 %res = call <16 x i16> @llvm.x86.avx2.psubs.w(<16 x i16> %arg0, <16 x i16> %arg1)
3197 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
3198 %res = call <32 x i8> @llvm.x86.avx2.psubus.b(<32 x i8> %arg0, <32 x i8> %arg1)
3215 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
3216 %res = call <16 x i16> @llvm.x86.avx2.psubus.w(<16 x i16> %arg0, <16 x i16> %arg1)
3233 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
3234 %res = shufflevector <32 x i8> %arg0, <32 x i8> %arg1, <32 x i32> <i32 8, i32 40, i32 9, i32 41, i32 10, i32 42, i32 11, i32 43, i32 12, i32 44, i32 13, i32 45, i32 14, i32 46, i32 15, i32 47, i32 24, i32 56, i32 25, i32 57, i32 26, i32 58, i32 27, i32 59, i32 28, i32 60, i32 29, i32 61, i32 30, i32 62, i32 31, i32 63>
3250 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
3251 %res = shufflevector <16 x i16> %arg0, <16 x i16> %arg1, <16 x i32> <i32 4, i32 20, i32 5, i32 21, i32 6, i32 22, i32 7, i32 23, i32 12, i32 28, i32 13, i32 29, i32 14, i32 30, i32 15, i32 31>
3267 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
3268 %res = shufflevector <8 x i32> %arg0, <8 x i32> %arg1, <8 x i32> <i32 2, i32 10, i32 3, i32 11, i32 6, i32 14, i32 7, i32 15>
3298 %arg1 = bitcast <4 x i64> %a1 to <32 x i8>
3299 %res = shufflevector <32 x i8> %arg0, <32 x i8> %arg1, <32 x i32> <i32 0, i32 32, i32 1, i32 33, i32 2, i32 34, i32 3, i32 35, i32 4, i32 36, i32 5, i32 37, i32 6, i32 38, i32 7, i32 39, i32 16, i32 48, i32 17, i32 49, i32 18, i32 50, i32 19, i32 51, i32 20, i32 52, i32 21, i32 53, i32 22, i32 54, i32 23, i32 55>
3315 %arg1 = bitcast <4 x i64> %a1 to <16 x i16>
3316 %res = shufflevector <16 x i16> %arg0, <16 x i16> %arg1, <16 x i32> <i32 0, i32 16, i32 1, i32 17, i32 2, i32 18, i32 3, i32 19, i32 8, i32 24, i32 9, i32 25, i32 10, i32 26, i32 11, i32 27>
3332 %arg1 = bitcast <4 x i64> %a1 to <8 x i32>
3333 %res = shufflevector <8 x i32> %arg0, <8 x i32> %arg1, <8 x i32> <i32 0, i32 8, i32 1, i32 9, i32 4, i32 12, i32 5, i32 13>