/external/XNNPACK/src/f32-dwconv/gen/ |
D | up16x25-minmax-avx512f-acc2.c | 265 const __m512 vi16x0123456789ABCDEF = _mm512_loadu_ps(i16); in xnn_f32_dwconv_minmax_ukernel_up16x25__avx512f_acc2() local 402 const __m512 vi16x0123456789ABCDEF = _mm512_maskz_loadu_ps(vmask, i16); in xnn_f32_dwconv_minmax_ukernel_up16x25__avx512f_acc2() local
|
D | up16x25-minmax-avx512f.c | 265 const __m512 vi16x0123456789ABCDEF = _mm512_loadu_ps(i16); in xnn_f32_dwconv_minmax_ukernel_up16x25__avx512f() local 400 const __m512 vi16x0123456789ABCDEF = _mm512_maskz_loadu_ps(vmask, i16); in xnn_f32_dwconv_minmax_ukernel_up16x25__avx512f() local
|
D | up32x25-minmax-avx512f-acc2.c | 314 const __m512 vi16x0123456789ABCDEF = _mm512_loadu_ps(i16); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f_acc2() local 509 const __m512 vi16x0123456789ABCDEF = _mm512_loadu_ps(i16); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f_acc2() local 646 const __m512 vi16x0123456789ABCDEF = _mm512_maskz_loadu_ps(vmask, i16); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f_acc2() local
|
D | up32x25-minmax-avx512f.c | 314 const __m512 vi16x0123456789ABCDEF = _mm512_loadu_ps(i16); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f() local 506 const __m512 vi16x0123456789ABCDEF = _mm512_loadu_ps(i16); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f() local 641 const __m512 vi16x0123456789ABCDEF = _mm512_maskz_loadu_ps(vmask, i16); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f() local
|
/external/XNNPACK/src/qs8-dwconv/gen/ |
D | up16x25-minmax-fp32-avx512skx-mul32.c | 268 … const __m512i vi16x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local 430 … const __m512i vi16x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local
|
D | up16x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 307 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_add16_vpunpck() local 568 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_add16_vpunpck() local
|
D | up32x25-minmax-fp32-avx512skx-mul32.c | 318 … const __m512i vi16x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local 535 … const __m512i vi16x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local
|
D | up16x25-minmax-fp32-avx2-mul16-vpunpck.c | 331 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpunpck() local 604 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpunpck() local
|
D | up16x25-minmax-fp32-avx2-mul16-vpmovsx.c | 312 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpmovsx() local 554 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpmovsx() local
|
D | up32x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 383 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local 717 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local
|
D | up16x25-minmax-rndnu-neon-mul8-ld128.c | 334 const int8x16_t vi16x0123456789ABCDEF = vld1q_s8(i16); i16 += 16; in xnn_qs8_dwconv_minmax_rndnu_ukernel_up16x25__neon_mul8_ld128() local
|
D | up16x25-minmax-rndnu-neon-mla8-ld128.c | 302 const int8x16_t vi16x0123456789ABCDEF = vld1q_s8(i16); i16 += 16; in xnn_qs8_dwconv_minmax_rndnu_ukernel_up16x25__neon_mla8_ld128() local
|
D | up32x25-minmax-fp32-avx2-mul16-vpunpck.c | 431 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpunpck() local 789 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpunpck() local
|
D | up32x25-minmax-fp32-avx2-mul16-vpmovsx.c | 410 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local 735 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local
|
/external/XNNPACK/src/qu8-dwconv/gen/ |
D | up16x25-minmax-fp32-avx512skx-mul32.c | 269 … const __m512i vi16x0123456789ABCDEF = _mm512_cvtepu8_epi32(_mm_loadu_si128((const __m128i*) i16)); in xnn_qu8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local 431 … const __m512i vi16x0123456789ABCDEF = _mm512_cvtepu8_epi32(_mm_loadu_si128((const __m128i*) i16)); in xnn_qu8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local
|
D | up32x25-minmax-fp32-avx512skx-mul32.c | 319 … const __m512i vi16x0123456789ABCDEF = _mm512_cvtepu8_epi32(_mm_loadu_si128((const __m128i*) i16)); in xnn_qu8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local 536 … const __m512i vi16x0123456789ABCDEF = _mm512_cvtepu8_epi32(_mm_loadu_si128((const __m128i*) i16)); in xnn_qu8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local
|
/external/XNNPACK/src/qc8-dwconv/gen/ |
D | up16x25-minmax-fp32-avx512skx-mul32.c | 267 … const __m512i vi16x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local 431 … const __m512i vi16x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local
|
D | up32x25-minmax-fp32-avx512skx-mul32.c | 317 … const __m512i vi16x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local 537 … const __m512i vi16x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local
|
D | up16x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 307 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_add16_vpunpck() local 570 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_add16_vpunpck() local
|
D | up16x25-minmax-fp32-avx2-mul16-vpmovsx.c | 312 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpmovsx() local 556 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpmovsx() local
|
D | up16x25-minmax-fp32-avx2-mul16-vpunpck.c | 331 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpunpck() local 606 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpunpck() local
|
D | up32x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 383 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local 721 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local
|
D | up32x25-minmax-fp32-avx2-mul16-vpmovsx.c | 410 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local 739 … const __m256i vi16x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i16)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local
|
D | up16x25-minmax-fp32-neon-mul8-ld128.c | 332 const int8x16_t vi16x0123456789ABCDEF = vld1q_s8(i16); i16 += 16; in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__neon_mul8_ld128() local
|
D | up16x25-minmax-fp32-neonv8-mul8-ld128.c | 332 const int8x16_t vi16x0123456789ABCDEF = vld1q_s8(i16); i16 += 16; in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__neonv8_mul8_ld128() local
|