Home | History | Annotate | Download | only in X86

Lines Matching full:next

10 ; AVX512F-NEXT:    vpshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
11 ; AVX512F-NEXT: retq
15 ; VL_BW_DQ-NEXT: vpsllq $63, %xmm0, %xmm0
16 ; VL_BW_DQ-NEXT: vptestmq %xmm0, %xmm0, %k0
17 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %xmm0
18 ; VL_BW_DQ-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[2,3,0,1]
19 ; VL_BW_DQ-NEXT: vpsllq $63, %xmm0, %xmm0
20 ; VL_BW_DQ-NEXT: vptestmq %xmm0, %xmm0, %k0
21 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %xmm0
22 ; VL_BW_DQ-NEXT: retq
30 ; AVX512F-NEXT: movl $1, %eax
31 ; AVX512F-NEXT: vmovq %rax, %xmm1
32 ; AVX512F-NEXT: vpalignr {{.*#+}} xmm0 = xmm0[8,9,10,11,12,13,14,15],xmm1[0,1,2,3,4,5,6,7]
33 ; AVX512F-NEXT: retq
37 ; VL_BW_DQ-NEXT: vpsllq $63, %xmm0, %xmm0
38 ; VL_BW_DQ-NEXT: vptestmq %xmm0, %xmm0, %k0
39 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %xmm0
40 ; VL_BW_DQ-NEXT: movb $1, %al
41 ; VL_BW_DQ-NEXT: kmovb %eax, %k0
42 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %xmm1
43 ; VL_BW_DQ-NEXT: vpalignr {{.*#+}} xmm0 = xmm0[8,9,10,11,12,13,14,15],xmm1[0,1,2,3,4,5,6,7]
44 ; VL_BW_DQ-NEXT: vpsllq $63, %xmm0, %xmm0
45 ; VL_BW_DQ-NEXT: vptestmq %xmm0, %xmm0, %k0
46 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %xmm0
47 ; VL_BW_DQ-NEXT: retq
56 ; AVX512F-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[3,2,1,0]
57 ; AVX512F-NEXT: retq
61 ; VL_BW_DQ-NEXT: vpslld $31, %xmm0, %xmm0
62 ; VL_BW_DQ-NEXT: vptestmd %xmm0, %xmm0, %k0
63 ; VL_BW_DQ-NEXT: vpmovm2d %k0, %xmm0
64 ; VL_BW_DQ-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[3,2,1,0]
65 ; VL_BW_DQ-NEXT: vpslld $31, %xmm0, %xmm0
66 ; VL_BW_DQ-NEXT: vptestmd %xmm0, %xmm0, %k0
67 ; VL_BW_DQ-NEXT: vpmovm2d %k0, %xmm0
68 ; VL_BW_DQ-NEXT: retq
76 ; AVX512F-NEXT: vpcmpeqq %zmm2, %zmm0, %k1
77 ; AVX512F-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0
78 ; AVX512F-NEXT: vmovdqa64 %zmm0, %zmm1 {%k1} {z}
79 ; AVX512F-NEXT: vmovdqa64 {{.*#+}} zmm2 = [3,6,1,0,3,7,7,0]
80 ; AVX512F-NEXT: vpermq %zmm1, %zmm2, %zmm1
81 ; AVX512F-NEXT: vpsllq $63, %zmm1, %zmm1
82 ; AVX512F-NEXT: vptestmq %zmm1, %zmm1, %k1
83 ; AVX512F-NEXT: vmovdqa64 %zmm0, %zmm0 {%k1} {z}
84 ; AVX512F-NEXT: vpmovqw %zmm0, %xmm0
85 ; AVX512F-NEXT: retq
89 ; VL_BW_DQ-NEXT: vpcmpeqq %zmm2, %zmm0, %k0
90 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %zmm0
91 ; VL_BW_DQ-NEXT: vmovdqa64 {{.*#+}} zmm1 = [3,6,1,0,3,7,7,0]
92 ; VL_BW_DQ-NEXT: vpermq %zmm0, %zmm1, %zmm0
93 ; VL_BW_DQ-NEXT: vpsllq $63, %zmm0, %zmm0
94 ; VL_BW_DQ-NEXT: vptestmq %zmm0, %zmm0, %k0
95 ; VL_BW_DQ-NEXT: vpmovm2w %k0, %xmm0
96 ; VL_BW_DQ-NEXT: retq
106 ; AVX512F-NEXT: vpcmpeqd %zmm2, %zmm0, %k1
107 ; AVX512F-NEXT: vpcmpeqd %zmm3, %zmm1, %k2
108 ; AVX512F-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0
109 ; AVX512F-NEXT: vmovdqa32 %zmm0, %zmm1 {%k2} {z}
110 ; AVX512F-NEXT: vmovdqa32 %zmm0, %zmm2 {%k1} {z}
111 ; AVX512F-NEXT: vmovdqa32 {{.*#+}} zmm3 = [3,6,22,12,3,7,7,0,3,6,1,13,3,21,7,0]
112 ; AVX512F-NEXT: vpermt2d %zmm1, %zmm3, %zmm2
113 ; AVX512F-NEXT: vpslld $31, %zmm2, %zmm1
114 ; AVX512F-NEXT: vptestmd %zmm1, %zmm1, %k1
115 ; AVX512F-NEXT: vmovdqa32 %zmm0, %zmm0 {%k1} {z}
116 ; AVX512F-NEXT: vpmovdb %zmm0, %xmm0
117 ; AVX512F-NEXT: retq
121 ; VL_BW_DQ-NEXT: vpcmpeqd %zmm2, %zmm0, %k0
122 ; VL_BW_DQ-NEXT: vpcmpeqd %zmm3, %zmm1, %k1
123 ; VL_BW_DQ-NEXT: vpmovm2d %k1, %zmm0
124 ; VL_BW_DQ-NEXT: vpmovm2d %k0, %zmm1
125 ; VL_BW_DQ-NEXT: vmovdqa32 {{.*#+}} zmm2 = [3,6,22,12,3,7,7,0,3,6,1,13,3,21,7,0]
126 ; VL_BW_DQ-NEXT: vpermt2d %zmm0, %zmm2, %zmm1
127 ; VL_BW_DQ-NEXT: vpslld $31, %zmm1, %zmm0
128 ; VL_BW_DQ-NEXT: vptestmd %zmm0, %zmm0, %k0
129 ; VL_BW_DQ-NEXT: vpmovm2b %k0, %xmm0
130 ; VL_BW_DQ-NEXT: retq
140 ; AVX512F-NEXT: vperm2i128 {{.*#+}} ymm1 = ymm0[2,3,0,1]
141 ; AVX512F-NEXT: vpshufb {{.*#+}} ymm1 = ymm1[u,u,6,u,u,u,u,u,u,u,u,u,u,5,u,u,19,22,u,28,19,23,23,16,19,22,17,29,19,u,23,16]
142 ; AVX512F-NEXT: vpshufb {{.*#+}} ymm0 = ymm0[3,6,u,12,3,7,7,0,3,6,1,13,3,u,7,0,u,u,22,u,u,u,u,u,u,u,u,u,u,21,u,u]
143 ; AVX512F-NEXT: vmovdqa {{.*#+}} ymm2 = [255,255,0,255,255,255,255,255,255,255,255,255,255,0,255,255,0,0,255,0,0,0,0,0,0,0,0,0,0,255,0,0]
144 ; AVX512F-NEXT: vpblendvb %ymm2, %ymm0, %ymm1, %ymm0
145 ; AVX512F-NEXT: retq
149 ; VL_BW_DQ-NEXT: vpsllw $7, %ymm0, %ymm0
150 ; VL_BW_DQ-NEXT: vpmovb2m %ymm0, %k0
151 ; VL_BW_DQ-NEXT: vpmovm2w %k0, %zmm0
152 ; VL_BW_DQ-NEXT: vmovdqu16 {{.*#+}} zmm1 = [3,6,22,12,3,7,7,0,3,6,1,13,3,21,7,0,3,6,22,12,3,7,7,0,3,6,1,13,3,21,7,0]
153 ; VL_BW_DQ-NEXT: vpermw %zmm0, %zmm1, %zmm0
154 ; VL_BW_DQ-NEXT: vpsllw $15, %zmm0, %zmm0
155 ; VL_BW_DQ-NEXT: vpmovw2m %zmm0, %k0
156 ; VL_BW_DQ-NEXT: vpmovm2b %k0, %ymm0
157 ; VL_BW_DQ-NEXT: retq
165 ; AVX512F-NEXT: kmovw %edi, %k1
166 ; AVX512F-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0
167 ; AVX512F-NEXT: vmovdqa64 %zmm0, %zmm1 {%k1} {z}
168 ; AVX512F-NEXT: vextracti32x4 $1, %zmm1, %xmm1
169 ; AVX512F-NEXT: vpbroadcastq %xmm1, %zmm1
170 ; AVX512F-NEXT: vpsllq $63, %zmm1, %zmm1
171 ; AVX512F-NEXT: vptestmq %zmm1, %zmm1, %k1
172 ; AVX512F-NEXT: vmovdqa64 %zmm0, %zmm0 {%k1} {z}
173 ; AVX512F-NEXT: vpmovqw %zmm0, %xmm0
174 ; AVX512F-NEXT: retq
178 ; VL_BW_DQ-NEXT: kmovb %edi, %k0
179 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %zmm0
180 ; VL_BW_DQ-NEXT: vextracti64x2 $1, %zmm0, %xmm0
181 ; VL_BW_DQ-NEXT: vpbroadcastq %xmm0, %zmm0
182 ; VL_BW_DQ-NEXT: vpsllq $63, %zmm0, %zmm0
183 ; VL_BW_DQ-NEXT: vptestmq %zmm0, %zmm0, %k0
184 ; VL_BW_DQ-NEXT: vpmovm2w %k0, %xmm0
185 ; VL_BW_DQ-NEXT: retq
194 ; AVX512F-NEXT: kmovw %edi, %k1
195 ; AVX512F-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0
196 ; AVX512F-NEXT: vmovdqa64 %zmm0, %zmm0 {%k1} {z}
197 ; AVX512F-NEXT: vpxord %zmm1, %zmm1, %zmm1
198 ; AVX512F-NEXT: vmovdqa64 {{.*#+}} zmm2 = <8,2,10,u,3,u,2,u>
199 ; AVX512F-NEXT: vpermt2q %zmm1, %zmm2, %zmm0
200 ; AVX512F-NEXT: vpsllq $63, %zmm0, %zmm0
201 ; AVX512F-NEXT: vptestmq %zmm0, %zmm0, %k0
202 ; AVX512F-NEXT: kmovw %k0, %eax
203 ; AVX512F-NEXT: # kill: %AL<def> %AL<kill> %EAX<kill>
204 ; AVX512F-NEXT: retq
208 ; VL_BW_DQ-NEXT: kmovb %edi, %k0
209 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %zmm0
210 ; VL_BW_DQ-NEXT: vpxord %zmm1, %zmm1, %zmm1
211 ; VL_BW_DQ-NEXT: vmovdqa64 {{.*#+}} zmm2 = <8,2,10,u,3,u,2,u>
212 ; VL_BW_DQ-NEXT: vpermt2q %zmm1, %zmm2, %zmm0
213 ; VL_BW_DQ-NEXT: vpsllq $63, %zmm0, %zmm0
214 ; VL_BW_DQ-NEXT: vptestmq %zmm0, %zmm0, %k0
215 ; VL_BW_DQ-NEXT: kmovb %k0, %eax
216 ; VL_BW_DQ-NEXT: # kill: %AL<def> %AL<kill> %EAX<kill>
217 ; VL_BW_DQ-NEXT: retq
227 ; AVX512F-NEXT: kmovw %edi, %k1
228 ; AVX512F-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0
229 ; AVX512F-NEXT: vmovdqa64 %zmm0, %zmm0 {%k1} {z}
230 ; AVX512F-NEXT: vshufi64x2 {{.*#+}} zmm0 = zmm0[0,1,4,5,0,1,0,1]
231 ; AVX512F-NEXT: vpsllq $63, %zmm0, %zmm0
232 ; AVX512F-NEXT: vptestmq %zmm0, %zmm0, %k0
233 ; AVX512F-NEXT: kmovw %k0, %eax
234 ; AVX512F-NEXT: # kill: %AL<def> %AL<kill> %EAX<kill>
235 ; AVX512F-NEXT: retq
239 ; VL_BW_DQ-NEXT: kmovb %edi, %k0
240 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %zmm0
241 ; VL_BW_DQ-NEXT: vshufi64x2 {{.*#+}} zmm0 = zmm0[0,1,4,5,0,1,0,1]
242 ; VL_BW_DQ-NEXT: vpsllq $63, %zmm0, %zmm0
243 ; VL_BW_DQ-NEXT: vptestmq %zmm0, %zmm0, %k0
244 ; VL_BW_DQ-NEXT: kmovb %k0, %eax
245 ; VL_BW_DQ-NEXT: # kill: %AL<def> %AL<kill> %EAX<kill>
246 ; VL_BW_DQ-NEXT: retq
256 ; AVX512F-NEXT: kmovw %edi, %k1
257 ; AVX512F-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0
258 ; AVX512F-NEXT: vmovdqa64 %zmm0, %zmm0 {%k1} {z}
259 ; AVX512F-NEXT: vpxord %zmm1, %zmm1, %zmm1
260 ; AVX512F-NEXT: vmovdqa64 {{.*#+}} zmm2 = [8,6,1,0,3,7,7,0]
261 ; AVX512F-NEXT: vpermt2q %zmm1, %zmm2, %zmm0
262 ; AVX512F-NEXT: vpsllq $63, %zmm0, %zmm0
263 ; AVX512F-NEXT: vptestmq %zmm0, %zmm0, %k0
264 ; AVX512F-NEXT: kmovw %k0, %eax
265 ; AVX512F-NEXT: # kill: %AL<def> %AL<kill> %EAX<kill>
266 ; AVX512F-NEXT: retq
270 ; VL_BW_DQ-NEXT: kmovb %edi, %k0
271 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %zmm0
272 ; VL_BW_DQ-NEXT: vpxord %zmm1, %zmm1, %zmm1
273 ; VL_BW_DQ-NEXT: vmovdqa64 {{.*#+}} zmm2 = [8,6,1,0,3,7,7,0]
274 ; VL_BW_DQ-NEXT: vpermt2q %zmm1, %zmm2, %zmm0
275 ; VL_BW_DQ-NEXT: vpsllq $63, %zmm0, %zmm0
276 ; VL_BW_DQ-NEXT: vptestmq %zmm0, %zmm0, %k0
277 ; VL_BW_DQ-NEXT: kmovb %k0, %eax
278 ; VL_BW_DQ-NEXT: # kill: %AL<def> %AL<kill> %EAX<kill>
279 ; VL_BW_DQ-NEXT: retq
289 ; AVX512F-NEXT: kmovw %edi, %k1
290 ; AVX512F-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0
291 ; AVX512F-NEXT: vmovdqa64 %zmm0, %zmm0 {%k1} {z}
292 ; AVX512F-NEXT: vmovdqa64 {{.*#+}} zmm1 = [9,1,2,10,4,5,6,7]
293 ; AVX512F-NEXT: vpxord %zmm2, %zmm2, %zmm2
294 ; AVX512F-NEXT: vpermt2q %zmm0, %zmm1, %zmm2
295 ; AVX512F-NEXT: vpsllq $63, %zmm2, %zmm0
296 ; AVX512F-NEXT: vptestmq %zmm0, %zmm0, %k0
297 ; AVX512F-NEXT: kmovw %k0, %eax
298 ; AVX512F-NEXT: # kill: %AL<def> %AL<kill> %EAX<kill>
299 ; AVX512F-NEXT: retq
303 ; VL_BW_DQ-NEXT: kmovb %edi, %k0
304 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %zmm0
305 ; VL_BW_DQ-NEXT: vmovdqa64 {{.*#+}} zmm1 = [9,1,2,10,4,5,6,7]
306 ; VL_BW_DQ-NEXT: vpxord %zmm2, %zmm2, %zmm2
307 ; VL_BW_DQ-NEXT: vpermt2q %zmm0, %zmm1, %zmm2
308 ; VL_BW_DQ-NEXT: vpsllq $63, %zmm2, %zmm0
309 ; VL_BW_DQ-NEXT: vptestmq %zmm0, %zmm0, %k0
310 ; VL_BW_DQ-NEXT: kmovb %k0, %eax
311 ; VL_BW_DQ-NEXT: # kill: %AL<def> %AL<kill> %EAX<kill>
312 ; VL_BW_DQ-NEXT: retq
322 ; AVX512F-NEXT: kmovw %edi, %k1
323 ; AVX512F-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0
324 ; AVX512F-NEXT: movb $51, %al
325 ; AVX512F-NEXT: kmovw %eax, %k2
326 ; AVX512F-NEXT: vmovdqa64 %zmm0, %zmm1 {%k2} {z}
327 ; AVX512F-NEXT: vmovdqa64 %zmm0, %zmm0 {%k1} {z}
328 ; AVX512F-NEXT: vmovdqa64 {{.*#+}} zmm2 = [9,6,1,0,3,7,7,1]
329 ; AVX512F-NEXT: vpermt2q %zmm0, %zmm2, %zmm1
330 ; AVX512F-NEXT: vpsllq $63, %zmm1, %zmm0
331 ; AVX512F-NEXT: vptestmq %zmm0, %zmm0, %k0
332 ; AVX512F-NEXT: kmovw %k0, %eax
333 ; AVX512F-NEXT: # kill: %AL<def> %AL<kill> %EAX<kill>
334 ; AVX512F-NEXT: retq
338 ; VL_BW_DQ-NEXT: kmovb %edi, %k0
339 ; VL_BW_DQ-NEXT: movb $51, %al
340 ; VL_BW_DQ-NEXT: kmovb %eax, %k1
341 ; VL_BW_DQ-NEXT: vpmovm2q %k1, %zmm0
342 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %zmm1
343 ; VL_BW_DQ-NEXT: vmovdqa64 {{.*#+}} zmm2 = [9,6,1,0,3,7,7,1]
344 ; VL_BW_DQ-NEXT: vpermt2q %zmm1, %zmm2, %zmm0
345 ; VL_BW_DQ-NEXT: vpsllq $63, %zmm0, %zmm0
346 ; VL_BW_DQ-NEXT: vptestmq %zmm0, %zmm0, %k0
347 ; VL_BW_DQ-NEXT: kmovb %k0, %eax
348 ; VL_BW_DQ-NEXT: # kill: %AL<def> %AL<kill> %EAX<kill>
349 ; VL_BW_DQ-NEXT: retq
359 ; AVX512F-NEXT: vpmovsxwq %xmm0, %zmm0
360 ; AVX512F-NEXT: vpsllq $63, %zmm0, %zmm0
361 ; AVX512F-NEXT: vptestmq %zmm0, %zmm0, %k1
362 ; AVX512F-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0
363 ; AVX512F-NEXT: vmovdqa64 %zmm0, %zmm1 {%k1} {z}
364 ; AVX512F-NEXT: vmovdqa64 {{.*#+}} zmm2 = [9,1,2,3,4,5,6,7]
365 ; AVX512F-NEXT: vpermt2q %zmm1, %zmm2, %zmm0
366 ; AVX512F-NEXT: vpsllq $63, %zmm0, %zmm0
367 ; AVX512F-NEXT: vptestmq %zmm0, %zmm0, %k0
368 ; AVX512F-NEXT: kmovw %k0, %eax
369 ; AVX512F-NEXT: # kill: %AL<def> %AL<kill> %EAX<kill>
370 ; AVX512F-NEXT: retq
374 ; VL_BW_DQ-NEXT: vpsllw $15, %xmm0, %xmm0
375 ; VL_BW_DQ-NEXT: vpmovw2m %xmm0, %k0
376 ; VL_BW_DQ-NEXT: vpmovm2q %k0, %zmm0
377 ; VL_BW_DQ-NEXT: vmovdqa64 {{.*#+}} zmm1 = [9,1,2,3,4,5,6,7]
378 ; VL_BW_DQ-NEXT: vpternlogd $255, %zmm2, %zmm2, %zmm2
379 ; VL_BW_DQ-NEXT: vpermt2q %zmm0, %zmm1, %zmm2
380 ; VL_BW_DQ-NEXT: vpsllq $63, %zmm2, %zmm0
381 ; VL_BW_DQ-NEXT: vptestmq %zmm0, %zmm0, %k0
382 ; VL_BW_DQ-NEXT: kmovb %k0, %eax
383 ; VL_BW_DQ-NEXT: # kill: %AL<def> %AL<kill> %EAX<kill>
384 ; VL_BW_DQ-NEXT: retq
394 ; AVX512F-NEXT: kmovw %edi, %k1
395 ; AVX512F-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0
396 ; AVX512F-NEXT: vmovdqa32 %zmm0, %zmm0 {%k1} {z}
397 ; AVX512F-NEXT: vpbroadcastd %xmm0, %zmm0
398 ; AVX512F-NEXT: vpslld $31, %zmm0, %zmm0
399 ; AVX512F-NEXT: vptestmd %zmm0, %zmm0, %k0
400 ; AVX512F-NEXT: kmovw %k0, %eax
401 ; AVX512F-NEXT: # kill: %AX<def> %AX<kill> %EAX<kill>
402 ; AVX512F-NEXT: retq
406 ; VL_BW_DQ-NEXT: kmovw %edi, %k0
407 ; VL_BW_DQ-NEXT: vpmovm2d %k0, %zmm0
408 ; VL_BW_DQ-NEXT: vpbroadcastd %xmm0, %zmm0
409 ; VL_BW_DQ-NEXT: vpslld $31, %zmm0, %zmm0
410 ; VL_BW_DQ-NEXT: vptestmd %zmm0, %zmm0, %k0
411 ; VL_BW_DQ-NEXT: kmovw %k0, %eax
412 ; VL_BW_DQ-NEXT: # kill: %AX<def> %AX<kill> %EAX<kill>
413 ; VL_BW_DQ-NEXT: retq
423 ; AVX512F-NEXT: pushq %rbp
424 ; AVX512F-NEXT: .Ltmp0:
425 ; AVX512F-NEXT: .cfi_def_cfa_offset 16
426 ; AVX512F-NEXT: .Ltmp1:
427 ; AVX512F-NEXT: .cfi_offset %rbp, -16
428 ; AVX512F-NEXT: movq %rsp, %rbp
429 ; AVX512F-NEXT: .Ltmp2:
430 ; AVX512F-NEXT: .cfi_def_cfa_register %rbp
431 ; AVX512F-NEXT: andq $-32, %rsp
432 ; AVX512F-NEXT: subq $96, %rsp
433 ; AVX512F-NEXT: movl %edi, {{[0-9]+}}(%rsp)
434 ; AVX512F-NEXT: vpternlogd $255, %zmm0, %zmm0, %zmm0
435 ; AVX512F-NEXT: kmovw {{[0-9]+}}(%rsp), %k1
436 ; AVX512F-NEXT: vmovdqa32 %zmm0, %zmm0 {%k1} {z}
437 ; AVX512F-NEXT: vpmovdb %zmm0, %xmm0
438 ; AVX512F-NEXT: vpbroadcastb %xmm0, %ymm0
439 ; AVX512F-NEXT: vextracti128 $1, %ymm0, %xmm1
440 ; AVX512F-NEXT: vpmovsxbd %xmm1, %zmm1
441 ; AVX512F-NEXT: vpslld $31, %zmm1, %zmm1
442 ; AVX512F-NEXT: vptestmd %zmm1, %zmm1, %k0
443 ; AVX512F-NEXT: kmovw %k0, {{[0-9]+}}(%rsp)
444 ; AVX512F-NEXT: vpmovsxbd %xmm0, %zmm0
445 ; AVX512F-NEXT: vpslld $31, %zmm0, %zmm0
446 ; AVX512F-NEXT: vptestmd %zmm0, %zmm0, %k0
447 ; AVX512F-NEXT: kmovw %k0, (%rsp)
448 ; AVX512F-NEXT: movl (%rsp), %ecx
449 ; AVX512F-NEXT: movq %rcx, %rax
450 ; AVX512F-NEXT: shlq $32, %rax
451 ; AVX512F-NEXT: orq %rcx, %rax
452 ; AVX512F-NEXT: movq %rbp, %rsp
453 ; AVX512F-NEXT: popq %rbp
454 ; AVX512F-NEXT: retq
458 ; VL_BW_DQ-NEXT: kmovq %rdi, %k0
459 ; VL_BW_DQ-NEXT: vpmovm2b %k0, %zmm0
460 ; VL_BW_DQ-NEXT: vpbroadcastb %xmm0, %zmm0
461 ; VL_BW_DQ-NEXT: vpsllw $7, %zmm0, %zmm0
462 ; VL_BW_DQ-NEXT: vpmovb2m %zmm0, %k0
463 ; VL_BW_DQ-NEXT: kmovq %k0, %rax
464 ; VL_BW_DQ-NEXT: retq