Lines Matching refs:AVX512F
3 …-mtriple=i386-unknown-linux-gnu -mcpu=knl -mattr=+avx512bw | FileCheck %s --check-prefix=AVX512F-32
17 ; AVX512F-32-LABEL: test_mask_adds_epi16_rr_512:
18 ; AVX512F-32: # %bb.0:
19 ; AVX512F-32-NEXT: vpaddsw %zmm1, %zmm0, %zmm0
20 ; AVX512F-32-NEXT: retl
34 ; AVX512F-32-LABEL: test_mask_adds_epi16_rrk_512:
35 ; AVX512F-32: # %bb.0:
36 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
37 ; AVX512F-32-NEXT: vpaddsw %zmm1, %zmm0, %zmm2 {%k1}
38 ; AVX512F-32-NEXT: vmovdqa64 %zmm2, %zmm0
39 ; AVX512F-32-NEXT: retl
53 ; AVX512F-32-LABEL: test_mask_adds_epi16_rrkz_512:
54 ; AVX512F-32: # %bb.0:
55 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
56 ; AVX512F-32-NEXT: vpaddsw %zmm1, %zmm0, %zmm0 {%k1} {z}
57 ; AVX512F-32-NEXT: retl
70 ; AVX512F-32-LABEL: test_mask_adds_epi16_rm_512:
71 ; AVX512F-32: # %bb.0:
72 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
73 ; AVX512F-32-NEXT: vpaddsw (%eax), %zmm0, %zmm0
74 ; AVX512F-32-NEXT: retl
88 ; AVX512F-32-LABEL: test_mask_adds_epi16_rmk_512:
89 ; AVX512F-32: # %bb.0:
90 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
91 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
92 ; AVX512F-32-NEXT: vpaddsw (%eax), %zmm0, %zmm1 {%k1}
93 ; AVX512F-32-NEXT: vmovdqa64 %zmm1, %zmm0
94 ; AVX512F-32-NEXT: retl
109 ; AVX512F-32-LABEL: test_mask_adds_epi16_rmkz_512:
110 ; AVX512F-32: # %bb.0:
111 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
112 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
113 ; AVX512F-32-NEXT: vpaddsw (%eax), %zmm0, %zmm0 {%k1} {z}
114 ; AVX512F-32-NEXT: retl
128 ; AVX512F-32-LABEL: test_mask_subs_epi16_rr_512:
129 ; AVX512F-32: # %bb.0:
130 ; AVX512F-32-NEXT: vpsubsw %zmm1, %zmm0, %zmm0
131 ; AVX512F-32-NEXT: retl
145 ; AVX512F-32-LABEL: test_mask_subs_epi16_rrk_512:
146 ; AVX512F-32: # %bb.0:
147 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
148 ; AVX512F-32-NEXT: vpsubsw %zmm1, %zmm0, %zmm2 {%k1}
149 ; AVX512F-32-NEXT: vmovdqa64 %zmm2, %zmm0
150 ; AVX512F-32-NEXT: retl
164 ; AVX512F-32-LABEL: test_mask_subs_epi16_rrkz_512:
165 ; AVX512F-32: # %bb.0:
166 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
167 ; AVX512F-32-NEXT: vpsubsw %zmm1, %zmm0, %zmm0 {%k1} {z}
168 ; AVX512F-32-NEXT: retl
181 ; AVX512F-32-LABEL: test_mask_subs_epi16_rm_512:
182 ; AVX512F-32: # %bb.0:
183 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
184 ; AVX512F-32-NEXT: vpsubsw (%eax), %zmm0, %zmm0
185 ; AVX512F-32-NEXT: retl
199 ; AVX512F-32-LABEL: test_mask_subs_epi16_rmk_512:
200 ; AVX512F-32: # %bb.0:
201 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
202 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
203 ; AVX512F-32-NEXT: vpsubsw (%eax), %zmm0, %zmm1 {%k1}
204 ; AVX512F-32-NEXT: vmovdqa64 %zmm1, %zmm0
205 ; AVX512F-32-NEXT: retl
220 ; AVX512F-32-LABEL: test_mask_subs_epi16_rmkz_512:
221 ; AVX512F-32: # %bb.0:
222 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
223 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
224 ; AVX512F-32-NEXT: vpsubsw (%eax), %zmm0, %zmm0 {%k1} {z}
225 ; AVX512F-32-NEXT: retl
241 ; AVX512F-32-LABEL: test_mask_adds_epi16_rr_1024:
242 ; AVX512F-32: # %bb.0:
243 ; AVX512F-32-NEXT: pushl %ebp
244 ; AVX512F-32-NEXT: .cfi_def_cfa_offset 8
245 ; AVX512F-32-NEXT: .cfi_offset %ebp, -8
246 ; AVX512F-32-NEXT: movl %esp, %ebp
247 ; AVX512F-32-NEXT: .cfi_def_cfa_register %ebp
248 ; AVX512F-32-NEXT: andl $-64, %esp
249 ; AVX512F-32-NEXT: subl $64, %esp
250 ; AVX512F-32-NEXT: vpaddsw %zmm2, %zmm0, %zmm0
251 ; AVX512F-32-NEXT: vpaddsw 8(%ebp), %zmm1, %zmm1
252 ; AVX512F-32-NEXT: movl %ebp, %esp
253 ; AVX512F-32-NEXT: popl %ebp
254 ; AVX512F-32-NEXT: .cfi_def_cfa %esp, 4
255 ; AVX512F-32-NEXT: retl
268 ; AVX512F-32-LABEL: test_mask_subs_epi16_rr_1024:
269 ; AVX512F-32: # %bb.0:
270 ; AVX512F-32-NEXT: pushl %ebp
271 ; AVX512F-32-NEXT: .cfi_def_cfa_offset 8
272 ; AVX512F-32-NEXT: .cfi_offset %ebp, -8
273 ; AVX512F-32-NEXT: movl %esp, %ebp
274 ; AVX512F-32-NEXT: .cfi_def_cfa_register %ebp
275 ; AVX512F-32-NEXT: andl $-64, %esp
276 ; AVX512F-32-NEXT: subl $64, %esp
277 ; AVX512F-32-NEXT: vpsubsw %zmm2, %zmm0, %zmm0
278 ; AVX512F-32-NEXT: vpsubsw 8(%ebp), %zmm1, %zmm1
279 ; AVX512F-32-NEXT: movl %ebp, %esp
280 ; AVX512F-32-NEXT: popl %ebp
281 ; AVX512F-32-NEXT: .cfi_def_cfa %esp, 4
282 ; AVX512F-32-NEXT: retl
298 ; AVX512F-32-LABEL: test_mask_adds_epu16_rr_512:
299 ; AVX512F-32: # %bb.0:
300 ; AVX512F-32-NEXT: vpaddusw %zmm1, %zmm0, %zmm0
301 ; AVX512F-32-NEXT: retl
315 ; AVX512F-32-LABEL: test_mask_adds_epu16_rrk_512:
316 ; AVX512F-32: # %bb.0:
317 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
318 ; AVX512F-32-NEXT: vpaddusw %zmm1, %zmm0, %zmm2 {%k1}
319 ; AVX512F-32-NEXT: vmovdqa64 %zmm2, %zmm0
320 ; AVX512F-32-NEXT: retl
334 ; AVX512F-32-LABEL: test_mask_adds_epu16_rrkz_512:
335 ; AVX512F-32: # %bb.0:
336 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
337 ; AVX512F-32-NEXT: vpaddusw %zmm1, %zmm0, %zmm0 {%k1} {z}
338 ; AVX512F-32-NEXT: retl
351 ; AVX512F-32-LABEL: test_mask_adds_epu16_rm_512:
352 ; AVX512F-32: # %bb.0:
353 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
354 ; AVX512F-32-NEXT: vpaddusw (%eax), %zmm0, %zmm0
355 ; AVX512F-32-NEXT: retl
369 ; AVX512F-32-LABEL: test_mask_adds_epu16_rmk_512:
370 ; AVX512F-32: # %bb.0:
371 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
372 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
373 ; AVX512F-32-NEXT: vpaddusw (%eax), %zmm0, %zmm1 {%k1}
374 ; AVX512F-32-NEXT: vmovdqa64 %zmm1, %zmm0
375 ; AVX512F-32-NEXT: retl
390 ; AVX512F-32-LABEL: test_mask_adds_epu16_rmkz_512:
391 ; AVX512F-32: # %bb.0:
392 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
393 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
394 ; AVX512F-32-NEXT: vpaddusw (%eax), %zmm0, %zmm0 {%k1} {z}
395 ; AVX512F-32-NEXT: retl
409 ; AVX512F-32-LABEL: test_mask_subs_epu16_rr_512:
410 ; AVX512F-32: # %bb.0:
411 ; AVX512F-32-NEXT: vpsubusw %zmm1, %zmm0, %zmm0
412 ; AVX512F-32-NEXT: retl
426 ; AVX512F-32-LABEL: test_mask_subs_epu16_rrk_512:
427 ; AVX512F-32: # %bb.0:
428 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
429 ; AVX512F-32-NEXT: vpsubusw %zmm1, %zmm0, %zmm2 {%k1}
430 ; AVX512F-32-NEXT: vmovdqa64 %zmm2, %zmm0
431 ; AVX512F-32-NEXT: retl
445 ; AVX512F-32-LABEL: test_mask_subs_epu16_rrkz_512:
446 ; AVX512F-32: # %bb.0:
447 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
448 ; AVX512F-32-NEXT: vpsubusw %zmm1, %zmm0, %zmm0 {%k1} {z}
449 ; AVX512F-32-NEXT: retl
462 ; AVX512F-32-LABEL: test_mask_subs_epu16_rm_512:
463 ; AVX512F-32: # %bb.0:
464 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
465 ; AVX512F-32-NEXT: vpsubusw (%eax), %zmm0, %zmm0
466 ; AVX512F-32-NEXT: retl
480 ; AVX512F-32-LABEL: test_mask_subs_epu16_rmk_512:
481 ; AVX512F-32: # %bb.0:
482 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
483 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
484 ; AVX512F-32-NEXT: vpsubusw (%eax), %zmm0, %zmm1 {%k1}
485 ; AVX512F-32-NEXT: vmovdqa64 %zmm1, %zmm0
486 ; AVX512F-32-NEXT: retl
501 ; AVX512F-32-LABEL: test_mask_subs_epu16_rmkz_512:
502 ; AVX512F-32: # %bb.0:
503 ; AVX512F-32-NEXT: movl {{[0-9]+}}(%esp), %eax
504 ; AVX512F-32-NEXT: kmovd {{[0-9]+}}(%esp), %k1
505 ; AVX512F-32-NEXT: vpsubusw (%eax), %zmm0, %zmm0 {%k1} {z}
506 ; AVX512F-32-NEXT: retl
522 ; AVX512F-32-LABEL: test_mask_adds_epu16_rr_1024:
523 ; AVX512F-32: # %bb.0:
524 ; AVX512F-32-NEXT: pushl %ebp
525 ; AVX512F-32-NEXT: .cfi_def_cfa_offset 8
526 ; AVX512F-32-NEXT: .cfi_offset %ebp, -8
527 ; AVX512F-32-NEXT: movl %esp, %ebp
528 ; AVX512F-32-NEXT: .cfi_def_cfa_register %ebp
529 ; AVX512F-32-NEXT: andl $-64, %esp
530 ; AVX512F-32-NEXT: subl $64, %esp
531 ; AVX512F-32-NEXT: vpaddusw %zmm2, %zmm0, %zmm0
532 ; AVX512F-32-NEXT: vpaddusw 8(%ebp), %zmm1, %zmm1
533 ; AVX512F-32-NEXT: movl %ebp, %esp
534 ; AVX512F-32-NEXT: popl %ebp
535 ; AVX512F-32-NEXT: .cfi_def_cfa %esp, 4
536 ; AVX512F-32-NEXT: retl
549 ; AVX512F-32-LABEL: test_mask_subs_epu16_rr_1024:
550 ; AVX512F-32: # %bb.0:
551 ; AVX512F-32-NEXT: pushl %ebp
552 ; AVX512F-32-NEXT: .cfi_def_cfa_offset 8
553 ; AVX512F-32-NEXT: .cfi_offset %ebp, -8
554 ; AVX512F-32-NEXT: movl %esp, %ebp
555 ; AVX512F-32-NEXT: .cfi_def_cfa_register %ebp
556 ; AVX512F-32-NEXT: andl $-64, %esp
557 ; AVX512F-32-NEXT: subl $64, %esp
558 ; AVX512F-32-NEXT: vpsubusw %zmm2, %zmm0, %zmm0
559 ; AVX512F-32-NEXT: vpsubusw 8(%ebp), %zmm1, %zmm1
560 ; AVX512F-32-NEXT: movl %ebp, %esp
561 ; AVX512F-32-NEXT: popl %ebp
562 ; AVX512F-32-NEXT: .cfi_def_cfa %esp, 4
563 ; AVX512F-32-NEXT: retl