/external/XNNPACK/src/f32-dwconv/gen/ |
D | up16x25-minmax-avx512f-acc2.c | 313 const __m512 vi24x0123456789ABCDEF = _mm512_loadu_ps(i24); in xnn_f32_dwconv_minmax_ukernel_up16x25__avx512f_acc2() local 434 const __m512 vi24x0123456789ABCDEF = _mm512_maskz_loadu_ps(vmask, i24); in xnn_f32_dwconv_minmax_ukernel_up16x25__avx512f_acc2() local
|
D | up16x25-minmax-avx512f.c | 313 const __m512 vi24x0123456789ABCDEF = _mm512_loadu_ps(i24); in xnn_f32_dwconv_minmax_ukernel_up16x25__avx512f() local 432 const __m512 vi24x0123456789ABCDEF = _mm512_maskz_loadu_ps(vmask, i24); in xnn_f32_dwconv_minmax_ukernel_up16x25__avx512f() local
|
D | up32x25-minmax-avx512f-acc2.c | 386 const __m512 vi24x0123456789ABCDEF = _mm512_loadu_ps(i24); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f_acc2() local 557 const __m512 vi24x0123456789ABCDEF = _mm512_loadu_ps(i24); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f_acc2() local 678 const __m512 vi24x0123456789ABCDEF = _mm512_maskz_loadu_ps(vmask, i24); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f_acc2() local
|
D | up32x25-minmax-avx512f.c | 386 const __m512 vi24x0123456789ABCDEF = _mm512_loadu_ps(i24); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f() local 554 const __m512 vi24x0123456789ABCDEF = _mm512_loadu_ps(i24); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f() local 673 const __m512 vi24x0123456789ABCDEF = _mm512_maskz_loadu_ps(vmask, i24); in xnn_f32_dwconv_minmax_ukernel_up32x25__avx512f() local
|
/external/XNNPACK/src/qs8-dwconv/gen/ |
D | up16x25-minmax-fp32-avx512skx-mul32.c | 316 … const __m512i vi24x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local 470 … const __m512i vi24x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local
|
D | up16x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 375 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_add16_vpunpck() local 640 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_add16_vpunpck() local
|
D | up32x25-minmax-fp32-avx512skx-mul32.c | 390 … const __m512i vi24x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local 583 … const __m512i vi24x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local
|
D | up16x25-minmax-fp32-avx2-mul16-vpunpck.c | 411 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpunpck() local 676 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpunpck() local
|
D | up16x25-minmax-fp32-avx2-mul16-vpmovsx.c | 384 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpmovsx() local 618 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpmovsx() local
|
D | up32x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 487 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local 797 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local
|
D | up16x25-minmax-rndnu-neon-mul8-ld128.c | 414 const int8x16_t vi24x0123456789ABCDEF = vld1q_s8(i24); i24 += 16; in xnn_qs8_dwconv_minmax_rndnu_ukernel_up16x25__neon_mul8_ld128() local
|
D | up16x25-minmax-rndnu-neon-mla8-ld128.c | 366 const int8x16_t vi24x0123456789ABCDEF = vld1q_s8(i24); i24 += 16; in xnn_qs8_dwconv_minmax_rndnu_ukernel_up16x25__neon_mla8_ld128() local
|
D | up32x25-minmax-fp32-avx2-mul16-vpunpck.c | 559 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpunpck() local 869 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpunpck() local
|
D | up32x25-minmax-fp32-avx2-mul16-vpmovsx.c | 530 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local 807 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qs8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local
|
/external/XNNPACK/src/qu8-dwconv/gen/ |
D | up16x25-minmax-fp32-avx512skx-mul32.c | 317 … const __m512i vi24x0123456789ABCDEF = _mm512_cvtepu8_epi32(_mm_loadu_si128((const __m128i*) i24)); in xnn_qu8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local 471 … const __m512i vi24x0123456789ABCDEF = _mm512_cvtepu8_epi32(_mm_loadu_si128((const __m128i*) i24)); in xnn_qu8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local
|
D | up32x25-minmax-fp32-avx512skx-mul32.c | 391 … const __m512i vi24x0123456789ABCDEF = _mm512_cvtepu8_epi32(_mm_loadu_si128((const __m128i*) i24)); in xnn_qu8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local 584 … const __m512i vi24x0123456789ABCDEF = _mm512_cvtepu8_epi32(_mm_loadu_si128((const __m128i*) i24)); in xnn_qu8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local
|
/external/XNNPACK/src/qc8-dwconv/gen/ |
D | up16x25-minmax-fp32-avx512skx-mul32.c | 315 … const __m512i vi24x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local 471 … const __m512i vi24x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx512skx_mul32() local
|
D | up32x25-minmax-fp32-avx512skx-mul32.c | 389 … const __m512i vi24x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local 585 … const __m512i vi24x0123456789ABCDEF = _mm512_cvtepi8_epi32(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx512skx_mul32() local
|
D | up16x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 375 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_add16_vpunpck() local 642 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_add16_vpunpck() local
|
D | up16x25-minmax-fp32-avx2-mul16-vpmovsx.c | 384 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpmovsx() local 620 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpmovsx() local
|
D | up16x25-minmax-fp32-avx2-mul16-vpunpck.c | 411 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpunpck() local 678 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__avx2_mul16_vpunpck() local
|
D | up32x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 487 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local 801 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local
|
D | up32x25-minmax-fp32-avx2-mul16-vpmovsx.c | 530 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local 811 … const __m256i vi24x0123456789ABCDEF = _mm256_cvtepi8_epi16(_mm_loadu_si128((const __m128i*) i24)); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local
|
D | up16x25-minmax-fp32-neon-mul8-ld128.c | 412 const int8x16_t vi24x0123456789ABCDEF = vld1q_s8(i24); i24 += 16; in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__neon_mul8_ld128() local
|
D | up16x25-minmax-fp32-neonv8-mul8-ld128.c | 412 const int8x16_t vi24x0123456789ABCDEF = vld1q_s8(i24); i24 += 16; in xnn_qc8_dwconv_minmax_fp32_ukernel_up16x25__neonv8_mul8_ld128() local
|