/external/XNNPACK/src/f32-dwconv/gen/ |
D | up16x25-minmax-avx512f-acc2.c | 277 const __m512 vi18x0123456789ABCDEF = _mm512_loadu_ps(i18); in xnn_f32_dwconv_minmax_ukernel_up16x25__avx512f_acc2() local 410 const __m512 vi18x0123456789ABCDEF = _mm512_maskz_loadu_ps(vmask, i18); in xnn_f32_dwconv_minmax_ukernel_up16x25__avx512f_acc2() local
|
D | up16x25-minmax-avx512f.c | 277 const __m512 vi18x0123456789ABCDEF = _mm512_loadu_ps(i18); in xnn_f32_dwconv_minmax_ukernel_up16x25__avx512f() local 408 const __m512 vi18x0123456789ABCDEF = _mm512_maskz_loadu_ps(vmask, i18); in xnn_f32_dwconv_minmax_ukernel_up16x25__avx512f() local
|
D | up32x25-minmax-avx512f-acc2.c | 332 const __m512 vi18x0123456789ABCDEF = _mm512_loadu_ps(i18); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f_acc2() local 521 const __m512 vi18x0123456789ABCDEF = _mm512_loadu_ps(i18); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f_acc2() local 654 const __m512 vi18x0123456789ABCDEF = _mm512_maskz_loadu_ps(vmask, i18); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f_acc2() local
|
D | up32x25-minmax-avx512f.c | 332 const __m512 vi18x0123456789ABCDEF = _mm512_loadu_ps(i18); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f() local 518 const __m512 vi18x0123456789ABCDEF = _mm512_loadu_ps(i18); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f() local 649 const __m512 vi18x0123456789ABCDEF = _mm512_maskz_loadu_ps(vmask, i18); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f() local
|
/external/XNNPACK/src/qs8-dwconv/gen/ |
D | up16x25-minmax-fp32-avx512skx-mul32.c | 280 … const __m512i vi18x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local 440 … const __m512i vi18x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local
|
D | up16x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 324 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_add16_vpunpck() local 586 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_add16_vpunpck() local
|
D | up32x25-minmax-fp32-avx512skx-mul32.c | 336 … const __m512i vi18x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local 547 … const __m512i vi18x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local
|
D | up16x25-minmax-fp32-avx2-mul16-vpunpck.c | 351 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpunpck() local 622 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpunpck() local
|
D | up16x25-minmax-fp32-avx2-mul16-vpmovsx.c | 330 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpmovsx() local 570 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpmovsx() local
|
D | up32x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 409 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local 737 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local
|
D | up16x25-minmax-rndnu-neon-mul8-ld128.c | 354 const int8x16_t vi18x0123456789ABCDEF = vld1q_s8(i18); i18 += 16; in xnn_qs8_dwconv_minmax_rndnu_ukernel_up16x25__neon_mul8_ld128() local
|
D | up16x25-minmax-rndnu-neon-mla8-ld128.c | 318 const int8x16_t vi18x0123456789ABCDEF = vld1q_s8(i18); i18 += 16; in xnn_qs8_dwconv_minmax_rndnu_ukernel_up16x25__neon_mla8_ld128() local
|
D | up32x25-minmax-fp32-avx2-mul16-vpunpck.c | 463 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpunpck() local 809 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpunpck() local
|
D | up32x25-minmax-fp32-avx2-mul16-vpmovsx.c | 440 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local 753 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local
|
/external/XNNPACK/src/qu8-dwconv/gen/ |
D | up16x25-minmax-fp32-avx512skx-mul32.c | 281 … const __m512i vi18x0123456789ABCDEF = _mm512_cvtepu8_epi32(_mm_loadu_si128((const __m128i*) i18)); in xnn_qu8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local 441 … const __m512i vi18x0123456789ABCDEF = _mm512_cvtepu8_epi32(_mm_loadu_si128((const __m128i*) i18)); in xnn_qu8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local
|
D | up32x25-minmax-fp32-avx512skx-mul32.c | 337 … const __m512i vi18x0123456789ABCDEF = _mm512_cvtepu8_epi32(_mm_loadu_si128((const __m128i*) i18)); in xnn_qu8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local 548 … const __m512i vi18x0123456789ABCDEF = _mm512_cvtepu8_epi32(_mm_loadu_si128((const __m128i*) i18)); in xnn_qu8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local
|
/external/XNNPACK/src/qc8-dwconv/gen/ |
D | up16x25-minmax-fp32-avx512skx-mul32.c | 279 … const __m512i vi18x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local 441 … const __m512i vi18x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local
|
D | up32x25-minmax-fp32-avx512skx-mul32.c | 335 … const __m512i vi18x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local 549 … const __m512i vi18x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local
|
D | up16x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 324 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_add16_vpunpck() local 588 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_add16_vpunpck() local
|
D | up16x25-minmax-fp32-avx2-mul16-vpmovsx.c | 330 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpmovsx() local 572 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpmovsx() local
|
D | up16x25-minmax-fp32-avx2-mul16-vpunpck.c | 351 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpunpck() local 624 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpunpck() local
|
D | up32x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 409 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local 741 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local
|
D | up32x25-minmax-fp32-avx2-mul16-vpmovsx.c | 440 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local 757 … const __m256i vi18x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i18)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local
|
D | up16x25-minmax-fp32-neon-mul8-ld128.c | 352 const int8x16_t vi18x0123456789ABCDEF = vld1q_s8(i18); i18 += 16; in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__neon_mul8_ld128() local
|
D | up16x25-minmax-fp32-neonv8-mul8-ld128.c | 352 const int8x16_t vi18x0123456789ABCDEF = vld1q_s8(i18); i18 += 16; in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__neonv8_mul8_ld128() local
|