Lines Matching refs:AVX512BW
2 …4-apple-darwin -mcpu=knl -mattr=+avx512bw | FileCheck %s --check-prefix=ALL --check-prefix=AVX512BW
8 ; AVX512BW-LABEL: test_int_x86_avx512_mask_storeu_b_512:
9 ; AVX512BW: ## BB#0:
10 ; AVX512BW-NEXT: kmovq %rdx, %k1
11 ; AVX512BW-NEXT: vmovdqu8 %zmm0, (%rdi) {%k1}
12 ; AVX512BW-NEXT: vmovdqu8 %zmm0, (%rsi)
13 ; AVX512BW-NEXT: retq
31 ; AVX512BW-LABEL: test_int_x86_avx512_mask_storeu_w_512:
32 ; AVX512BW: ## BB#0:
33 ; AVX512BW-NEXT: kmovd %edx, %k1
34 ; AVX512BW-NEXT: vmovdqu16 %zmm0, (%rdi) {%k1}
35 ; AVX512BW-NEXT: vmovdqu16 %zmm0, (%rsi)
36 ; AVX512BW-NEXT: retq
54 ; AVX512BW-LABEL: test_int_x86_avx512_mask_loadu_w_512:
55 ; AVX512BW: ## BB#0:
56 ; AVX512BW-NEXT: vmovdqu16 (%rdi), %zmm0
57 ; AVX512BW-NEXT: kmovd %edx, %k1
58 ; AVX512BW-NEXT: vmovdqu16 (%rsi), %zmm0 {%k1}
59 ; AVX512BW-NEXT: vmovdqu16 (%rdi), %zmm1 {%k1} {z}
60 ; AVX512BW-NEXT: vpaddw %zmm1, %zmm0, %zmm0
61 ; AVX512BW-NEXT: retq
83 ; AVX512BW-LABEL: test_int_x86_avx512_mask_loadu_b_512:
84 ; AVX512BW: ## BB#0:
85 ; AVX512BW-NEXT: vmovdqu8 (%rdi), %zmm0
86 ; AVX512BW-NEXT: kmovq %rdx, %k1
87 ; AVX512BW-NEXT: vmovdqu8 (%rsi), %zmm0 {%k1}
88 ; AVX512BW-NEXT: vmovdqu8 (%rdi), %zmm1 {%k1} {z}
89 ; AVX512BW-NEXT: vpaddb %zmm1, %zmm0, %zmm0
90 ; AVX512BW-NEXT: retq
112 ; AVX512BW-LABEL: test_int_x86_avx512_psll_dq_512:
113 ; AVX512BW: ## BB#0:
114 ; AVX512BW-NEXT: vpslldq {{.*#+}} zmm1 = zero,zero,zero,zero,zero,zero,zero,zero,zmm0[0,1,2,3,4,…
115 ; AVX512BW-NEXT: vpslldq {{.*#+}} zmm0 = zero,zero,zero,zero,zmm0[0,1,2,3,4,5,6,7,8,9,10,11],zer…
116 ; AVX512BW-NEXT: vpaddq %zmm0, %zmm1, %zmm0
117 ; AVX512BW-NEXT: retq
132 ; AVX512BW-LABEL: test_int_x86_avx512_psll_load_dq_512:
133 ; AVX512BW: ## BB#0:
134 ; AVX512BW-NEXT: vpslldq {{.*#+}} zmm0 = zero,zero,zero,zero,mem[0,1,2,3,4,5,6,7,8,9,10,11],zero…
135 ; AVX512BW-NEXT: retq
150 ; AVX512BW-LABEL: test_int_x86_avx512_psrl_dq_512:
151 ; AVX512BW: ## BB#0:
152 ; AVX512BW-NEXT: vpsrldq {{.*#+}} zmm1 = zmm0[8,9,10,11,12,13,14,15],zero,zero,zero,zero,zero,ze…
153 ; AVX512BW-NEXT: vpsrldq {{.*#+}} zmm0 = zmm0[4,5,6,7,8,9,10,11,12,13,14,15],zero,zero,zero,zero…
154 ; AVX512BW-NEXT: vpaddq %zmm0, %zmm1, %zmm0
155 ; AVX512BW-NEXT: retq
170 ; AVX512BW-LABEL: test_int_x86_avx512_psrl_load_dq_512:
171 ; AVX512BW: ## BB#0:
172 ; AVX512BW-NEXT: vpsrldq {{.*#+}} zmm0 = mem[4,5,6,7,8,9,10,11,12,13,14,15],zero,zero,zero,zero,…
173 ; AVX512BW-NEXT: retq
188 ; AVX512BW-LABEL: test_int_x86_avx512_mask_palignr_512:
189 ; AVX512BW: ## BB#0:
190 ; AVX512BW-NEXT: vpalignr {{.*#+}} zmm3 = zmm1[2,3,4,5,6,7,8,9,10,11,12,13,14,15],zmm0[0,1],zmm1…
191 ; AVX512BW-NEXT: kmovq %rdi, %k1
192 ; AVX512BW-NEXT: vpalignr {{.*#+}} zmm2 {%k1} = zmm1[2,3,4,5,6,7,8,9,10,11,12,13,14,15],zmm0[0,1…
193 ; AVX512BW-NEXT: vpalignr {{.*#+}} zmm0 {%k1} {z} = zmm1[2,3,4,5,6,7,8,9,10,11,12,13,14,15],zmm0…
194 ; AVX512BW-NEXT: vpaddb %zmm0, %zmm2, %zmm0
195 ; AVX512BW-NEXT: vpaddb %zmm3, %zmm0, %zmm0
196 ; AVX512BW-NEXT: retq
218 ; AVX512BW-LABEL: test_int_x86_avx512_mask_pshufh_w_512:
219 ; AVX512BW: ## BB#0:
220 ; AVX512BW-NEXT: vpshufhw {{.*#+}} zmm2 = zmm0[0,1,2,3,7,4,4,4,8,9,10,11,15,12,12,12,16,17,18,19…
221 ; AVX512BW-NEXT: kmovd %esi, %k1
222 ; AVX512BW-NEXT: vpshufhw {{.*#+}} zmm1 {%k1} = zmm0[0,1,2,3,7,4,4,4,8,9,10,11,15,12,12,12,16,17…
223 ; AVX512BW-NEXT: vpshufhw {{.*#+}} zmm0 {%k1} {z} = zmm0[0,1,2,3,7,4,4,4,8,9,10,11,15,12,12,12,1…
224 ; AVX512BW-NEXT: vpaddw %zmm0, %zmm1, %zmm0
225 ; AVX512BW-NEXT: vpaddw %zmm2, %zmm0, %zmm0
226 ; AVX512BW-NEXT: retq
248 ; AVX512BW-LABEL: test_int_x86_avx512_mask_pshufl_w_512:
249 ; AVX512BW: ## BB#0:
250 ; AVX512BW-NEXT: vpshuflw {{.*#+}} zmm2 = zmm0[3,0,0,0,4,5,6,7,11,8,8,8,12,13,14,15,19,16,16,16,…
251 ; AVX512BW-NEXT: kmovd %esi, %k1
252 ; AVX512BW-NEXT: vpshuflw {{.*#+}} zmm1 {%k1} = zmm0[3,0,0,0,4,5,6,7,11,8,8,8,12,13,14,15,19,16,…
253 ; AVX512BW-NEXT: vpshuflw {{.*#+}} zmm0 {%k1} {z} = zmm0[3,0,0,0,4,5,6,7,11,8,8,8,12,13,14,15,19…
254 ; AVX512BW-NEXT: vpaddw %zmm0, %zmm1, %zmm0
255 ; AVX512BW-NEXT: vpaddw %zmm2, %zmm0, %zmm0
256 ; AVX512BW-NEXT: retq
276 ; AVX512BW-LABEL: test_pcmpeq_b:
277 ; AVX512BW: ## BB#0:
278 ; AVX512BW-NEXT: vpcmpeqb %zmm1, %zmm0, %k0
279 ; AVX512BW-NEXT: kmovq %k0, %rax
280 ; AVX512BW-NEXT: retq
298 ; AVX512BW-LABEL: test_mask_pcmpeq_b:
299 ; AVX512BW: ## BB#0:
300 ; AVX512BW-NEXT: kmovq %rdi, %k1
301 ; AVX512BW-NEXT: vpcmpeqb %zmm1, %zmm0, %k0 {%k1}
302 ; AVX512BW-NEXT: kmovq %k0, %rax
303 ; AVX512BW-NEXT: retq
324 ; AVX512BW-LABEL: test_pcmpeq_w:
325 ; AVX512BW: ## BB#0:
326 ; AVX512BW-NEXT: vpcmpeqw %zmm1, %zmm0, %k0
327 ; AVX512BW-NEXT: kmovd %k0, %eax
328 ; AVX512BW-NEXT: retq
340 ; AVX512BW-LABEL: test_mask_pcmpeq_w:
341 ; AVX512BW: ## BB#0:
342 ; AVX512BW-NEXT: kmovd %edi, %k1
343 ; AVX512BW-NEXT: vpcmpeqw %zmm1, %zmm0, %k0 {%k1}
344 ; AVX512BW-NEXT: kmovd %k0, %eax
345 ; AVX512BW-NEXT: retq
360 ; AVX512BW-LABEL: test_pcmpgt_b:
361 ; AVX512BW: ## BB#0:
362 ; AVX512BW-NEXT: vpcmpgtb %zmm1, %zmm0, %k0
363 ; AVX512BW-NEXT: kmovq %k0, %rax
364 ; AVX512BW-NEXT: retq
382 ; AVX512BW-LABEL: test_mask_pcmpgt_b:
383 ; AVX512BW: ## BB#0:
384 ; AVX512BW-NEXT: kmovq %rdi, %k1
385 ; AVX512BW-NEXT: vpcmpgtb %zmm1, %zmm0, %k0 {%k1}
386 ; AVX512BW-NEXT: kmovq %k0, %rax
387 ; AVX512BW-NEXT: retq
408 ; AVX512BW-LABEL: test_pcmpgt_w:
409 ; AVX512BW: ## BB#0:
410 ; AVX512BW-NEXT: vpcmpgtw %zmm1, %zmm0, %k0
411 ; AVX512BW-NEXT: kmovd %k0, %eax
412 ; AVX512BW-NEXT: retq
424 ; AVX512BW-LABEL: test_mask_pcmpgt_w:
425 ; AVX512BW: ## BB#0:
426 ; AVX512BW-NEXT: kmovd %edi, %k1
427 ; AVX512BW-NEXT: vpcmpgtw %zmm1, %zmm0, %k0 {%k1}
428 ; AVX512BW-NEXT: kmovd %k0, %eax
429 ; AVX512BW-NEXT: retq
446 ; AVX512BW-LABEL: test_int_x86_avx512_mask_punpckhb_w_512:
447 ; AVX512BW: ## BB#0:
448 ; AVX512BW-NEXT: vpunpckhbw {{.*#+}} zmm3 = zmm0[8],zmm1[8],zmm0[9],zmm1[9],zmm0[10],zmm1[10],zm…
449 ; AVX512BW-NEXT: kmovq %rdi, %k1
450 ; AVX512BW-NEXT: vpunpckhbw {{.*#+}} zmm2 {%k1} = zmm0[8],zmm1[8],zmm0[9],zmm1[9],zmm0[10],zmm1[…
451 ; AVX512BW-NEXT: vpaddb %zmm3, %zmm2, %zmm0
452 ; AVX512BW-NEXT: retq
470 ; AVX512BW-LABEL: test_int_x86_avx512_mask_punpcklb_w_512:
471 ; AVX512BW: ## BB#0:
472 ; AVX512BW-NEXT: vpunpcklbw {{.*#+}} zmm3 = zmm0[0],zmm1[0],zmm0[1],zmm1[1],zmm0[2],zmm1[2],zmm0…
473 ; AVX512BW-NEXT: kmovq %rdi, %k1
474 ; AVX512BW-NEXT: vpunpcklbw {{.*#+}} zmm2 {%k1} = zmm0[0],zmm1[0],zmm0[1],zmm1[1],zmm0[2],zmm1[2…
475 ; AVX512BW-NEXT: vpaddb %zmm3, %zmm2, %zmm0
476 ; AVX512BW-NEXT: retq
494 ; AVX512BW-LABEL: test_int_x86_avx512_mask_punpckhw_d_512:
495 ; AVX512BW: ## BB#0:
496 ; AVX512BW-NEXT: vpunpckhwd {{.*#+}} zmm3 = zmm0[4],zmm1[4],zmm0[5],zmm1[5],zmm0[6],zmm1[6],zmm0…
497 ; AVX512BW-NEXT: kmovd %edi, %k1
498 ; AVX512BW-NEXT: vpunpckhwd {{.*#+}} zmm2 {%k1} = zmm0[4],zmm1[4],zmm0[5],zmm1[5],zmm0[6],zmm1[6…
499 ; AVX512BW-NEXT: vpaddw %zmm3, %zmm2, %zmm0
500 ; AVX512BW-NEXT: retq
518 ; AVX512BW-LABEL: test_int_x86_avx512_mask_punpcklw_d_512:
519 ; AVX512BW: ## BB#0:
520 ; AVX512BW-NEXT: vpunpcklwd {{.*#+}} zmm3 = zmm0[0],zmm1[0],zmm0[1],zmm1[1],zmm0[2],zmm1[2],zmm0…
521 ; AVX512BW-NEXT: kmovd %edi, %k1
522 ; AVX512BW-NEXT: vpunpcklwd {{.*#+}} zmm2 {%k1} = zmm0[0],zmm1[0],zmm0[1],zmm1[1],zmm0[2],zmm1[2…
523 ; AVX512BW-NEXT: vpaddw %zmm3, %zmm2, %zmm0
524 ; AVX512BW-NEXT: retq