• Home
  • Raw
  • Download

Lines Matching refs:AVX512F

3 …wn-linux-gnu -mcpu=knl -mattr=+avx512bw | FileCheck %s --check-prefix=ALL --check-prefix=AVX512F-32
15 ; AVX512F-32-LABEL: test_int_x86_avx512_mask_storeu_b_512:
16 ; AVX512F-32: # BB#0:
17 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
18 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %ecx
19 ; AVX512F-32-NEXT: kmovq {{[0-9]+}}(%esp), %k1
20 ; AVX512F-32-NEXT: vmovdqu8 %zmm0, (%ecx) {%k1}
21 ; AVX512F-32-NEXT: vmovdqu8 %zmm0, (%eax)
22 ; AVX512F-32-NEXT: retl
38 ; AVX512F-32-LABEL: test_int_x86_avx512_mask_storeu_w_512:
39 ; AVX512F-32: # BB#0:
40 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
41 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %ecx
42 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
43 ; AVX512F-32-NEXT: vmovdqu16 %zmm0, (%ecx) {%k1}
44 ; AVX512F-32-NEXT: vmovdqu16 %zmm0, (%eax)
45 ; AVX512F-32-NEXT: retl
63 ; AVX512F-32-LABEL: test_int_x86_avx512_mask_loadu_w_512:
64 ; AVX512F-32: # BB#0:
65 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
66 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %ecx
67 ; AVX512F-32-NEXT: vmovdqu16 (%ecx), %zmm0
68 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
69 ; AVX512F-32-NEXT: vmovdqu16 (%eax), %zmm0 {%k1}
70 ; AVX512F-32-NEXT: vmovdqu16 (%ecx), %zmm1 {%k1} {z}
71 ; AVX512F-32-NEXT: vpaddw %zmm1, %zmm0, %zmm0
72 ; AVX512F-32-NEXT: retl
92 ; AVX512F-32-LABEL: test_int_x86_avx512_mask_loadu_b_512:
93 ; AVX512F-32: # BB#0:
94 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
95 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %ecx
96 ; AVX512F-32-NEXT: vmovdqu8 (%ecx), %zmm0
97 ; AVX512F-32-NEXT: kmovq {{[0-9]+}}(%esp), %k1
98 ; AVX512F-32-NEXT: vmovdqu8 (%eax), %zmm0 {%k1}
99 ; AVX512F-32-NEXT: vmovdqu8 (%ecx), %zmm1 {%k1} {z}
100 ; AVX512F-32-NEXT: vpaddb %zmm1, %zmm0, %zmm0
101 ; AVX512F-32-NEXT: retl
119 ; AVX512F-32-LABEL: test_int_x86_avx512_psll_dq_512:
120 ; AVX512F-32: # BB#0:
121 ; AVX512F-32-NEXT: vpslldq {{.*#+}} zmm1 = zero,zero,zero,zero,zero,zero,zero,zero,zmm0[0,1,2,3,…
122 ; AVX512F-32-NEXT: vpslldq {{.*#+}} zmm0 = zero,zero,zero,zero,zmm0[0,1,2,3,4,5,6,7,8,9,10,11],z…
123 ; AVX512F-32-NEXT: vpaddq %zmm0, %zmm1, %zmm0
124 ; AVX512F-32-NEXT: retl
137 ; AVX512F-32-LABEL: test_int_x86_avx512_psll_load_dq_512:
138 ; AVX512F-32: # BB#0:
139 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
140 ; AVX512F-32-NEXT: vpslldq {{.*#+}} zmm0 = zero,zero,zero,zero,mem[0,1,2,3,4,5,6,7,8,9,10,11],ze…
141 ; AVX512F-32-NEXT: retl
157 ; AVX512F-32-LABEL: test_int_x86_avx512_psrl_dq_512:
158 ; AVX512F-32: # BB#0:
159 ; AVX512F-32-NEXT: vpsrldq {{.*#+}} zmm1 = zmm0[8,9,10,11,12,13,14,15],zero,zero,zero,zero,zero,…
160 ; AVX512F-32-NEXT: vpsrldq {{.*#+}} zmm0 = zmm0[4,5,6,7,8,9,10,11,12,13,14,15],zero,zero,zero,ze…
161 ; AVX512F-32-NEXT: vpaddq %zmm0, %zmm1, %zmm0
162 ; AVX512F-32-NEXT: retl
175 ; AVX512F-32-LABEL: test_int_x86_avx512_psrl_load_dq_512:
176 ; AVX512F-32: # BB#0:
177 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
178 ; AVX512F-32-NEXT: vpsrldq {{.*#+}} zmm0 = mem[4,5,6,7,8,9,10,11,12,13,14,15],zero,zero,zero,zer…
179 ; AVX512F-32-NEXT: retl
198 ; AVX512F-32-LABEL: test_int_x86_avx512_mask_palignr_512:
199 ; AVX512F-32: # BB#0:
200 ; AVX512F-32-NEXT: vpalignr {{.*#+}} zmm3 = zmm1[2,3,4,5,6,7,8,9,10,11,12,13,14,15],zmm0[0,1],zm…
201 ; AVX512F-32-NEXT: kmovq {{[0-9]+}}(%esp), %k1
202 ; AVX512F-32-NEXT: vpalignr {{.*#+}} zmm2 {%k1} = zmm1[2,3,4,5,6,7,8,9,10,11,12,13,14,15],zmm0[0…
203 ; AVX512F-32-NEXT: vpalignr {{.*#+}} zmm0 {%k1} {z} = zmm1[2,3,4,5,6,7,8,9,10,11,12,13,14,15],zm…
204 ; AVX512F-32-NEXT: vpaddb %zmm0, %zmm2, %zmm0
205 ; AVX512F-32-NEXT: vpaddb %zmm3, %zmm0, %zmm0
206 ; AVX512F-32-NEXT: retl
228 ; AVX512F-32-LABEL: test_int_x86_avx512_mask_pshufh_w_512:
229 ; AVX512F-32: # BB#0:
230 ; AVX512F-32-NEXT: vpshufhw {{.*#+}} zmm2 = zmm0[0,1,2,3,7,4,4,4,8,9,10,11,15,12,12,12,16,17,18,…
231 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
232 ; AVX512F-32-NEXT: vpshufhw {{.*#+}} zmm1 {%k1} = zmm0[0,1,2,3,7,4,4,4,8,9,10,11,15,12,12,12,16,…
233 ; AVX512F-32-NEXT: vpshufhw {{.*#+}} zmm0 {%k1} {z} = zmm0[0,1,2,3,7,4,4,4,8,9,10,11,15,12,12,12…
234 ; AVX512F-32-NEXT: vpaddw %zmm0, %zmm1, %zmm0
235 ; AVX512F-32-NEXT: vpaddw %zmm2, %zmm0, %zmm0
236 ; AVX512F-32-NEXT: retl
258 ; AVX512F-32-LABEL: test_int_x86_avx512_mask_pshufl_w_512:
259 ; AVX512F-32: # BB#0:
260 ; AVX512F-32-NEXT: vpshuflw {{.*#+}} zmm2 = zmm0[3,0,0,0,4,5,6,7,11,8,8,8,12,13,14,15,19,16,16,1…
261 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
262 ; AVX512F-32-NEXT: vpshuflw {{.*#+}} zmm1 {%k1} = zmm0[3,0,0,0,4,5,6,7,11,8,8,8,12,13,14,15,19,1…
263 ; AVX512F-32-NEXT: vpshuflw {{.*#+}} zmm0 {%k1} {z} = zmm0[3,0,0,0,4,5,6,7,11,8,8,8,12,13,14,15,…
264 ; AVX512F-32-NEXT: vpaddw %zmm0, %zmm1, %zmm0
265 ; AVX512F-32-NEXT: vpaddw %zmm2, %zmm0, %zmm0
266 ; AVX512F-32-NEXT: retl
282 ; AVX512F-32-LABEL: test_pcmpeq_b:
283 ; AVX512F-32: # BB#0:
284 ; AVX512F-32-NEXT: subl $12, %esp
285 ; AVX512F-32-NEXT: .Ltmp0:
286 ; AVX512F-32-NEXT: .cfi_def_cfa_offset 16
287 ; AVX512F-32-NEXT: vpcmpeqb %zmm1, %zmm0, %k0
288 ; AVX512F-32-NEXT: kmovq %k0, (%esp)
289 ; AVX512F-32-NEXT: movl (%esp), %eax
290 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %edx
291 ; AVX512F-32-NEXT: addl $12, %esp
292 ; AVX512F-32-NEXT: retl
305 ; AVX512F-32-LABEL: test_mask_pcmpeq_b:
306 ; AVX512F-32: # BB#0:
307 ; AVX512F-32-NEXT: subl $12, %esp
308 ; AVX512F-32-NEXT: .Ltmp1:
309 ; AVX512F-32-NEXT: .cfi_def_cfa_offset 16
310 ; AVX512F-32-NEXT: kmovq {{[0-9]+}}(%esp), %k1
311 ; AVX512F-32-NEXT: vpcmpeqb %zmm1, %zmm0, %k0 {%k1}
312 ; AVX512F-32-NEXT: kmovq %k0, (%esp)
313 ; AVX512F-32-NEXT: movl (%esp), %eax
314 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %edx
315 ; AVX512F-32-NEXT: addl $12, %esp
316 ; AVX512F-32-NEXT: retl
330 ; AVX512F-32-LABEL: test_pcmpeq_w:
331 ; AVX512F-32: # BB#0:
332 ; AVX512F-32-NEXT: vpcmpeqw %zmm1, %zmm0, %k0
333 ; AVX512F-32-NEXT: kmovd %k0, %eax
334 ; AVX512F-32-NEXT: retl
347 ; AVX512F-32-LABEL: test_mask_pcmpeq_w:
348 ; AVX512F-32: # BB#0:
349 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
350 ; AVX512F-32-NEXT: vpcmpeqw %zmm1, %zmm0, %k0 {%k1}
351 ; AVX512F-32-NEXT: kmovd %k0, %eax
352 ; AVX512F-32-NEXT: retl
366 ; AVX512F-32-LABEL: test_pcmpgt_b:
367 ; AVX512F-32: # BB#0:
368 ; AVX512F-32-NEXT: subl $12, %esp
369 ; AVX512F-32-NEXT: .Ltmp2:
370 ; AVX512F-32-NEXT: .cfi_def_cfa_offset 16
371 ; AVX512F-32-NEXT: vpcmpgtb %zmm1, %zmm0, %k0
372 ; AVX512F-32-NEXT: kmovq %k0, (%esp)
373 ; AVX512F-32-NEXT: movl (%esp), %eax
374 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %edx
375 ; AVX512F-32-NEXT: addl $12, %esp
376 ; AVX512F-32-NEXT: retl
389 ; AVX512F-32-LABEL: test_mask_pcmpgt_b:
390 ; AVX512F-32: # BB#0:
391 ; AVX512F-32-NEXT: subl $12, %esp
392 ; AVX512F-32-NEXT: .Ltmp3:
393 ; AVX512F-32-NEXT: .cfi_def_cfa_offset 16
394 ; AVX512F-32-NEXT: kmovq {{[0-9]+}}(%esp), %k1
395 ; AVX512F-32-NEXT: vpcmpgtb %zmm1, %zmm0, %k0 {%k1}
396 ; AVX512F-32-NEXT: kmovq %k0, (%esp)
397 ; AVX512F-32-NEXT: movl (%esp), %eax
398 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %edx
399 ; AVX512F-32-NEXT: addl $12, %esp
400 ; AVX512F-32-NEXT: retl
414 ; AVX512F-32-LABEL: test_pcmpgt_w:
415 ; AVX512F-32: # BB#0:
416 ; AVX512F-32-NEXT: vpcmpgtw %zmm1, %zmm0, %k0
417 ; AVX512F-32-NEXT: kmovd %k0, %eax
418 ; AVX512F-32-NEXT: retl
431 ; AVX512F-32-LABEL: test_mask_pcmpgt_w:
432 ; AVX512F-32: # BB#0:
433 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
434 ; AVX512F-32-NEXT: vpcmpgtw %zmm1, %zmm0, %k0 {%k1}
435 ; AVX512F-32-NEXT: kmovd %k0, %eax
436 ; AVX512F-32-NEXT: retl
454 ; AVX512F-32-LABEL: test_int_x86_avx512_mask_punpckhb_w_512:
455 ; AVX512F-32: # BB#0:
456 ; AVX512F-32-NEXT: vpunpckhbw {{.*#+}} zmm3 = zmm0[8],zmm1[8],zmm0[9],zmm1[9],zmm0[10],zmm1[10],…
457 ; AVX512F-32-NEXT: kmovq {{[0-9]+}}(%esp), %k1
458 ; AVX512F-32-NEXT: vpunpckhbw {{.*#+}} zmm2 {%k1} = zmm0[8],zmm1[8],zmm0[9],zmm1[9],zmm0[10],zmm…
459 ; AVX512F-32-NEXT: vpaddb %zmm3, %zmm2, %zmm0
460 ; AVX512F-32-NEXT: retl
478 ; AVX512F-32-LABEL: test_int_x86_avx512_mask_punpcklb_w_512:
479 ; AVX512F-32: # BB#0:
480 ; AVX512F-32-NEXT: vpunpcklbw {{.*#+}} zmm3 = zmm0[0],zmm1[0],zmm0[1],zmm1[1],zmm0[2],zmm1[2],zm…
481 ; AVX512F-32-NEXT: kmovq {{[0-9]+}}(%esp), %k1
482 ; AVX512F-32-NEXT: vpunpcklbw {{.*#+}} zmm2 {%k1} = zmm0[0],zmm1[0],zmm0[1],zmm1[1],zmm0[2],zmm1…
483 ; AVX512F-32-NEXT: vpaddb %zmm3, %zmm2, %zmm0
484 ; AVX512F-32-NEXT: retl
502 ; AVX512F-32-LABEL: test_int_x86_avx512_mask_punpckhw_d_512:
503 ; AVX512F-32: # BB#0:
504 ; AVX512F-32-NEXT: vpunpckhwd {{.*#+}} zmm3 = zmm0[4],zmm1[4],zmm0[5],zmm1[5],zmm0[6],zmm1[6],zm…
505 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
506 ; AVX512F-32-NEXT: vpunpckhwd {{.*#+}} zmm2 {%k1} = zmm0[4],zmm1[4],zmm0[5],zmm1[5],zmm0[6],zmm1…
507 ; AVX512F-32-NEXT: vpaddw %zmm3, %zmm2, %zmm0
508 ; AVX512F-32-NEXT: retl
526 ; AVX512F-32-LABEL: test_int_x86_avx512_mask_punpcklw_d_512:
527 ; AVX512F-32: # BB#0:
528 ; AVX512F-32-NEXT: vpunpcklwd {{.*#+}} zmm3 = zmm0[0],zmm1[0],zmm0[1],zmm1[1],zmm0[2],zmm1[2],zm…
529 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
530 ; AVX512F-32-NEXT: vpunpcklwd {{.*#+}} zmm2 {%k1} = zmm0[0],zmm1[0],zmm0[1],zmm1[1],zmm0[2],zmm1…
531 ; AVX512F-32-NEXT: vpaddw %zmm3, %zmm2, %zmm0
532 ; AVX512F-32-NEXT: retl