HomeSort by relevance Sort by last modified time
    Searched full:sse41 (Results 26 - 50 of 212) sorted by null

12 3 4 5 6 7 8 9

  /external/llvm/test/CodeGen/X86/
vector-rotate-128.ll 3 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
36 ; SSE41-LABEL: var_rotate_v2i64:
37 ; SSE41: # BB#0:
38 ; SSE41-NEXT: movdqa {{.*#+}} xmm2 = [64,64]
39 ; SSE41-NEXT: psubq %xmm1, %xmm2
40 ; SSE41-NEXT: movdqa %xmm0, %xmm3
41 ; SSE41-NEXT: psllq %xmm1, %xmm3
42 ; SSE41-NEXT: pshufd {{.*#+}} xmm1 = xmm1[2,3,0,1]
43 ; SSE41-NEXT: movdqa %xmm0, %xmm4
44 ; SSE41-NEXT: psllq %xmm1, %xmm
    [all...]
vector-idiv.ll 3 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=SSE --check-prefix=SSE41
47 ; SSE41-LABEL: PR20355:
48 ; SSE41: # BB#0: # %entry
49 ; SSE41-NEXT: movdqa {{.*#+}} xmm1 = [1431655766,1431655766,1431655766,1431655766]
50 ; SSE41-NEXT: pshufd {{.*#+}} xmm2 = xmm1[1,1,3,3]
51 ; SSE41-NEXT: pshufd {{.*#+}} xmm3 = xmm0[1,1,3,3]
52 ; SSE41-NEXT: pmuldq %xmm2, %xmm3
53 ; SSE41-NEXT: pmuldq %xmm1, %xmm0
54 ; SSE41-NEXT: pshufd {{.*#+}} xmm1 = xmm0[1,1,3,3]
55 ; SSE41-NEXT: pblendw {{.*#+}} xmm1 = xmm1[0,1],xmm3[2,3],xmm1[4,5],xmm3[6,7
    [all...]
vec_minmax_sint.ll 3 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
34 ; SSE41-LABEL: max_gt_v2i64:
35 ; SSE41: # BB#0:
36 ; SSE41-NEXT: movdqa %xmm0, %xmm2
37 ; SSE41-NEXT: movdqa {{.*#+}} xmm0 = [2147483648,0,2147483648,0]
38 ; SSE41-NEXT: movdqa %xmm1, %xmm3
39 ; SSE41-NEXT: pxor %xmm0, %xmm3
40 ; SSE41-NEXT: pxor %xmm2, %xmm0
41 ; SSE41-NEXT: movdqa %xmm0, %xmm4
42 ; SSE41-NEXT: pcmpgtd %xmm3, %xmm
    [all...]
vec_minmax_uint.ll 3 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
34 ; SSE41-LABEL: max_gt_v2i64:
35 ; SSE41: # BB#0:
36 ; SSE41-NEXT: movdqa %xmm0, %xmm2
37 ; SSE41-NEXT: movdqa {{.*#+}} xmm0 = [2147483648,2147483648,2147483648,2147483648]
38 ; SSE41-NEXT: movdqa %xmm1, %xmm3
39 ; SSE41-NEXT: pxor %xmm0, %xmm3
40 ; SSE41-NEXT: pxor %xmm2, %xmm0
41 ; SSE41-NEXT: movdqa %xmm0, %xmm4
42 ; SSE41-NEXT: pcmpgtd %xmm3, %xmm
    [all...]
vec_cmp_sint-128.ll 3 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
24 ; SSE41-LABEL: eq_v2i64:
25 ; SSE41: # BB#0:
26 ; SSE41-NEXT: pcmpeqq %xmm1, %xmm0
27 ; SSE41-NEXT: retq
122 ; SSE41-LABEL: ne_v2i64:
123 ; SSE41: # BB#0:
124 ; SSE41-NEXT: pcmpeqq %xmm1, %xmm0
125 ; SSE41-NEXT: pcmpeqd %xmm1, %xmm1
126 ; SSE41-NEXT: pxor %xmm1, %xmm
    [all...]
commute-blend-sse41.ll 10 %2 = call <8 x i16> @llvm.x86.sse41.pblendw(<8 x i16> %1, <8 x i16> %a, i8 17)
13 declare <8 x i16> @llvm.x86.sse41.pblendw(<8 x i16>, <8 x i16>, i8) nounwind readnone
21 %2 = call <4 x float> @llvm.x86.sse41.blendps(<4 x float> %1, <4 x float> %a, i8 5)
24 declare <4 x float> @llvm.x86.sse41.blendps(<4 x float>, <4 x float>, i8) nounwind readnone
32 %2 = call <2 x double> @llvm.x86.sse41.blendpd(<2 x double> %1, <2 x double> %a, i8 1)
35 declare <2 x double> @llvm.x86.sse41.blendpd(<2 x double>, <2 x double>, i8) nounwind readnone
sse41-intrinsics-x86-upgrade.ll 12 %res = call <2 x double> @llvm.x86.sse41.blendpd(<2 x double> %a0, <2 x double> %a1, i32 6) ; <<2 x double>> [#uses=1]
15 declare <2 x double> @llvm.x86.sse41.blendpd(<2 x double>, <2 x double>, i32) nounwind readnone
23 %res = call <4 x float> @llvm.x86.sse41.blendps(<4 x float> %a0, <4 x float> %a1, i32 7) ; <<4 x float>> [#uses=1]
26 declare <4 x float> @llvm.x86.sse41.blendps(<4 x float>, <4 x float>, i32) nounwind readnone
34 %res = call <2 x double> @llvm.x86.sse41.dppd(<2 x double> %a0, <2 x double> %a1, i32 7) ; <<2 x double>> [#uses=1]
37 declare <2 x double> @llvm.x86.sse41.dppd(<2 x double>, <2 x double>, i32) nounwind readnone
45 %res = call <4 x float> @llvm.x86.sse41.dpps(<4 x float> %a0, <4 x float> %a1, i32 7) ; <<4 x float>> [#uses=1]
48 declare <4 x float> @llvm.x86.sse41.dpps(<4 x float>, <4 x float>, i32) nounwind readnone
56 %res = call <4 x float> @llvm.x86.sse41.insertps(<4 x float> %a0, <4 x float> %a1, i32 17) ; <<4 x float>> [#uses=1]
59 declare <4 x float> @llvm.x86.sse41.insertps(<4 x float>, <4 x float>, i32) nounwind readnon
    [all...]
vector-shift-shl-128.ll 3 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
28 ; SSE41-LABEL: var_shift_v2i64:
29 ; SSE41: # BB#0:
30 ; SSE41-NEXT: movdqa %xmm0, %xmm2
31 ; SSE41-NEXT: psllq %xmm1, %xmm2
32 ; SSE41-NEXT: pshufd {{.*#+}} xmm1 = xmm1[2,3,0,1]
33 ; SSE41-NEXT: psllq %xmm1, %xmm0
34 ; SSE41-NEXT: pblendw {{.*#+}} xmm0 = xmm2[0,1,2,3],xmm0[4,5,6,7]
35 ; SSE41-NEXT: retq
95 ; SSE41-LABEL: var_shift_v4i32
    [all...]
vector-popcnt-128.ll 5 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
68 ; SSE41-LABEL: testv2i64:
69 ; SSE41: # BB#0:
70 ; SSE41-NEXT: movdqa {{.*#+}} xmm1 = [15,15,15,15,15,15,15,15,15,15,15,15,15,15,15,15]
71 ; SSE41-NEXT: movdqa %xmm0, %xmm2
72 ; SSE41-NEXT: pand %xmm1, %xmm2
73 ; SSE41-NEXT: movdqa {{.*#+}} xmm3 = [0,1,1,2,1,2,2,3,1,2,2,3,2,3,3,4]
74 ; SSE41-NEXT: movdqa %xmm3, %xmm4
75 ; SSE41-NEXT: pshufb %xmm2, %xmm4
76 ; SSE41-NEXT: psrlw $4, %xmm
    [all...]
vec_uint_to_fp.ll 2 ; RUN: llc < %s -mtriple=x86_64-apple-macosx -mattr=+sse4.1 | FileCheck --check-prefix=CHECK --check-prefix=SSE41 --check-prefix=CST %s
56 ; SSE41: movdqa [[LOWCSTADDR]](%rip), [[LOWVEC:%xmm[0-9]+]]
57 ; SSE41-NEXT: pblendw $85, %xmm0, [[LOWVEC]]
58 ; SSE41-NEXT: psrld $16, %xmm0
59 ; SSE41-NEXT: pblendw $170, [[HIGHCSTADDR]](%rip), %xmm0
60 ; SSE41-NEXT: addps [[MAGICCSTADDR]](%rip), %xmm0
61 ; SSE41-NEXT: addps [[LOWVEC]], %xmm0
62 ; SSE41-NEXT: retq
122 ; SSE41: movdqa {{.*#+}} [[LOWCST:xmm[0-9]+]] = [1258291200,1258291200,1258291200,1258291200]
123 ; SSE41-NEXT: movdqa %xmm0, [[VECLOW:%xmm[0-9]+]
    [all...]
vec_cmp_uint-128.ll 3 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
24 ; SSE41-LABEL: eq_v2i64:
25 ; SSE41: # BB#0:
26 ; SSE41-NEXT: pcmpeqq %xmm1, %xmm0
27 ; SSE41-NEXT: retq
122 ; SSE41-LABEL: ne_v2i64:
123 ; SSE41: # BB#0:
124 ; SSE41-NEXT: pcmpeqq %xmm1, %xmm0
125 ; SSE41-NEXT: pcmpeqd %xmm1, %xmm1
126 ; SSE41-NEXT: pxor %xmm1, %xmm
    [all...]
pmul.ll 3 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=SSE --check-prefix=SSE41
26 ; SSE41-LABEL: mul_v16i8c:
27 ; SSE41: # BB#0: # %entry
28 ; SSE41-NEXT: pmovsxbw %xmm0, %xmm1
29 ; SSE41-NEXT: pmovsxbw {{.*}}(%rip), %xmm2
30 ; SSE41-NEXT: pmullw %xmm2, %xmm1
31 ; SSE41-NEXT: movdqa {{.*#+}} xmm3 = [255,255,255,255,255,255,255,255]
32 ; SSE41-NEXT: pand %xmm3, %xmm1
33 ; SSE41-NEXT: pshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
34 ; SSE41-NEXT: pmovsxbw %xmm0, %xmm
    [all...]
pr20088.ll 3 declare <16 x i8> @llvm.x86.sse41.pblendvb(<16 x i8>, <16 x i8>, <16 x i8>)
7 %res = call <16 x i8> @llvm.x86.sse41.pblendvb(<16 x i8> zeroinitializer, <16 x i8> <i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1, i8 1>, <16 x i8> %x)
combine-64bit-vec-binop.ll 1 ; RUN: llc < %s -march=x86-64 -mcpu=corei7 -mtriple=x86_64-unknown-linux-gnu | FileCheck %s -check-prefix=CHECK -check-prefix=SSE41
13 ; SSE41: paddd
26 ; SSE41: paddw
38 ; SSE41: paddb
51 ; SSE41: psubd
64 ; SSE41: psubw
77 ; SSE41: psubb
90 ; SSE41: pmulld
103 ; SSE41: pmullw
129 ; SSE41: andp
    [all...]
vec_setcc.ll 3 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=SSE --check-prefix=SSE41
48 ; SSE41-LABEL: v8i16_icmp_uge:
49 ; SSE41: # BB#0:
50 ; SSE41-NEXT: pmaxuw %xmm0, %xmm1
51 ; SSE41-NEXT: pcmpeqw %xmm1, %xmm0
52 ; SSE41-NEXT: retq
72 ; SSE41-LABEL: v8i16_icmp_ule:
73 ; SSE41: # BB#0:
74 ; SSE41-NEXT: pminuw %xmm0, %xmm1
75 ; SSE41-NEXT: pcmpeqw %xmm1, %xmm
    [all...]
pmovext.ll 13 %4 = tail call <8 x i16> @llvm.x86.sse41.pmovzxbw(<16 x i8> %3) nounwind
20 declare <8 x i16> @llvm.x86.sse41.pmovzxbw(<16 x i8>) nounwind readnone
31 %tmp2 = tail call <4 x i32> @llvm.x86.sse41.pmovzxwd(<8 x i16> %tmp1) nounwind
41 %tmp2 = tail call <8 x i16> @llvm.x86.sse41.pmovzxbw(<16 x i8> %tmp1)
45 declare <4 x i32> @llvm.x86.sse41.pmovzxwd(<8 x i16>) nounwind readnone
vector-shift-ashr-128.ll 3 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
36 ; SSE41-LABEL: var_shift_v2i64:
37 ; SSE41: # BB#0:
38 ; SSE41-NEXT: movdqa {{.*#+}} xmm2 = [9223372036854775808,9223372036854775808]
39 ; SSE41-NEXT: movdqa %xmm2, %xmm3
40 ; SSE41-NEXT: psrlq %xmm1, %xmm3
41 ; SSE41-NEXT: pshufd {{.*#+}} xmm4 = xmm1[2,3,0,1]
42 ; SSE41-NEXT: psrlq %xmm4, %xmm2
43 ; SSE41-NEXT: pblendw {{.*#+}} xmm2 = xmm3[0,1,2,3],xmm2[4,5,6,7]
44 ; SSE41-NEXT: movdqa %xmm0, %xmm
    [all...]
vector-shift-lshr-128.ll 3 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
28 ; SSE41-LABEL: var_shift_v2i64:
29 ; SSE41: # BB#0:
30 ; SSE41-NEXT: movdqa %xmm0, %xmm2
31 ; SSE41-NEXT: psrlq %xmm1, %xmm2
32 ; SSE41-NEXT: pshufd {{.*#+}} xmm1 = xmm1[2,3,0,1]
33 ; SSE41-NEXT: psrlq %xmm1, %xmm0
34 ; SSE41-NEXT: pblendw {{.*#+}} xmm0 = xmm2[0,1,2,3],xmm0[4,5,6,7]
35 ; SSE41-NEXT: retq
106 ; SSE41-LABEL: var_shift_v4i32
    [all...]
vector-shuffle-variable-128.ll 4 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
93 ; SSE41-LABEL: var_shuffle_v4f32_v4f32_xxxx_i32:
94 ; SSE41: # BB#0:
95 ; SSE41-NEXT: movslq %edi, %rax
96 ; SSE41-NEXT: movslq %esi, %rsi
97 ; SSE41-NEXT: movslq %edx, %rdx
98 ; SSE41-NEXT: movaps %xmm0, -{{[0-9]+}}(%rsp)
99 ; SSE41-NEXT: movslq %ecx, %rcx
100 ; SSE41-NEXT: movss {{.*#+}} xmm0 = mem[0],zero,zero,zero
101 ; SSE41-NEXT: insertps {{.*#+}} xmm0 = xmm0[0],mem[0],xmm0[2,3
    [all...]
vector-shuffle-128-v4.ll 5 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mcpu=x86-64 -mattr=+sse4.1 | FileCheck %s --check-prefix=ALL --check-prefix=SSE --check-prefix=SSE41
264 ; SSE41-LABEL: shuffle_v4f32_0022:
265 ; SSE41: # BB#0:
266 ; SSE41-NEXT: movsldup {{.*#+}} xmm0 = xmm0[0,0,2,2]
267 ; SSE41-NEXT: retq
292 ; SSE41-LABEL: shuffle_v4f32_1133:
293 ; SSE41: # BB#0:
294 ; SSE41-NEXT: movshdup {{.*#+}} xmm0 = xmm0[1,1,3,3]
295 ; SSE41-NEXT: retq
353 ; SSE41-LABEL: shuffle_v4i32_0124
    [all...]
vector-zext.ll 4 ; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+sse4.1 | FileCheck %s --check-prefix=SSE --check-prefix=SSE41
22 ; SSE41-LABEL: zext_16i8_to_8i16:
23 ; SSE41: # BB#0: # %entry
24 ; SSE41-NEXT: pmovzxbw {{.*#+}} xmm0 = xmm0[0],zero,xmm0[1],zero,xmm0[2],zero,xmm0[3],zero,xmm0[4],zero,xmm0[5],zero,xmm0[6],zero,xmm0[7],zero
25 ; SSE41-NEXT: retq
55 ; SSE41-LABEL: zext_16i8_to_16i16:
56 ; SSE41: # BB#0: # %entry
57 ; SSE41-NEXT: movdqa %xmm0, %xmm1
58 ; SSE41-NEXT: pxor %xmm2, %xmm2
59 ; SSE41-NEXT: pmovzxbw {{.*#+}} xmm0 = xmm1[0],zero,xmm1[1],zero,xmm1[2],zero,xmm1[3],zero,xmm1[4],zero (…)
    [all...]
  /external/swiftshader/third_party/subzero/tests_lit/llvm2ice_tests/
vector-ops.ll 8 ; RUN: | FileCheck --check-prefix=SSE41 %s
10 ; RUN: | FileCheck --check-prefix=SSE41 %s
28 ; SSE41-LABEL: insertelement_v4f32_0
29 ; SSE41: insertps {{.*}},{{.*}},0x0
58 ; SSE41-LABEL: insertelement_v4i32_0
59 ; SSE41: pinsrd {{.*}},{{.*}},0x0
81 ; SSE41-LABEL: insertelement_v4f32_1
82 ; SSE41: insertps {{.*}},{{.*}},0x10
104 ; SSE41-LABEL: insertelement_v4i32_1
105 ; SSE41: pinsrd {{.*}},{{.*}},0x
    [all...]
  /external/swiftshader/third_party/LLVM/test/CodeGen/X86/
2008-04-24-pblendw-fold-crash.ll 1 ; RUN: llc < %s -mattr=+sse41
11 %tmp129 = call <8 x i16> @llvm.x86.sse41.pblendw( <8 x i16> zeroinitializer, <8 x i16> %tmp126, i32 2 ) nounwind ; <<8 x i16>> [#uses=0]
15 declare <8 x i16> @llvm.x86.sse41.pblendw(<8 x i16>, <8 x i16>, i32) nounwind
movgs.ll 1 ; RUN: llc < %s -march=x86 -mtriple=i386-linux-gnu -mattr=sse41 | FileCheck %s --check-prefix=X32
2 ; RUN: llc < %s -mtriple=x86_64-linux -mattr=sse41 | FileCheck %s --check-prefix=X64
3 ; RUN: llc < %s -mtriple=x86_64-win32 -mattr=sse41 | FileCheck %s --check-prefix=X64
44 %2 = tail call <4 x i32> @llvm.x86.sse41.pmovsxwd(<8 x i16> %1) nounwind readnone
58 declare <4 x i32> @llvm.x86.sse41.pmovsxwd(<8 x i16>) nounwind readnone
  /external/clang/test/CodeGen/
sse41-builtins.c 9 // NOTE: This should match the tests in llvm/test/CodeGen/X86/sse41-intrinsics-fast-isel.ll
31 // CHECK: call <16 x i8> @llvm.x86.sse41.pblendvb(<16 x i8> %{{.*}}, <16 x i8> %{{.*}}, <16 x i8> %{{.*}})
37 // CHECK: call <2 x double> @llvm.x86.sse41.blendvpd(<2 x double> %{{.*}}, <2 x double> %{{.*}}, <2 x double> %{{.*}})
43 // CHECK: call <4 x float> @llvm.x86.sse41.blendvps(<4 x float> %{{.*}}, <4 x float> %{{.*}}, <4 x float> %{{.*}})
49 // CHECK: call <2 x double> @llvm.x86.sse41.round.pd(<2 x double> %{{.*}}, i32 2)
55 // CHECK: call <4 x float> @llvm.x86.sse41.round.ps(<4 x float> %{{.*}}, i32 2)
61 // CHECK: call <2 x double> @llvm.x86.sse41.round.sd(<2 x double> %{{.*}}, <2 x double> %{{.*}}, i32 2)
67 // CHECK: call <4 x float> @llvm.x86.sse41.round.ss(<4 x float> %{{.*}}, <4 x float> %{{.*}}, i32 2)
164 // CHECK: call <2 x double> @llvm.x86.sse41.dppd(<2 x double> {{.*}}, <2 x double> {{.*}}, i8 7)
170 // CHECK: call <4 x float> @llvm.x86.sse41.dpps(<4 x float> {{.*}}, <4 x float> {{.*}}, i8 7
    [all...]

Completed in 989 milliseconds

12 3 4 5 6 7 8 9