Searched refs:vscaleGHIJKLMN (Results 1 – 10 of 10) sorted by relevance
/external/XNNPACK/src/qc8-dwconv/gen/ |
D | up24x9-minmax-fp32-avx2-mul32.c | 205 const __m256 vscaleGHIJKLMN = _mm256_loadu_ps((const float*) w + 16); in xnn_qc8_dwconv_minmax_fp32_ukernel_up24x9__avx2_mul32() local 209 vscaledGHIJKLMN = _mm256_mul_ps(vscaledGHIJKLMN, vscaleGHIJKLMN); in xnn_qc8_dwconv_minmax_fp32_ukernel_up24x9__avx2_mul32()
|
D | up32x9-minmax-fp32-avx2-mul16-add16-vpunpck.c | 229 …const __m256 vscaleGHIJKLMN = _mm256_loadu_ps((const float*) ((uintptr_t) w + 16 * sizeof(float))); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x9__avx2_mul16_add16_vpunpck() local 234 vfpaccGHIJKLMN = _mm256_mul_ps(vfpaccGHIJKLMN, vscaleGHIJKLMN); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x9__avx2_mul16_add16_vpunpck()
|
D | up32x9-minmax-fp32-avx2-mul32.c | 234 const __m256 vscaleGHIJKLMN = _mm256_loadu_ps((const float*) w + 16); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x9__avx2_mul32() local 239 vscaledGHIJKLMN = _mm256_mul_ps(vscaledGHIJKLMN, vscaleGHIJKLMN); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x9__avx2_mul32()
|
D | up32x9-minmax-fp32-avx2-mul16-vpunpck.c | 253 …const __m256 vscaleGHIJKLMN = _mm256_loadu_ps((const float*) ((uintptr_t) w + 16 * sizeof(float))); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x9__avx2_mul16_vpunpck() local 258 vfpaccGHIJKLMN = _mm256_mul_ps(vfpaccGHIJKLMN, vscaleGHIJKLMN); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x9__avx2_mul16_vpunpck()
|
D | up32x9-minmax-fp32-avx2-mul16-vpmovsx.c | 234 …const __m256 vscaleGHIJKLMN = _mm256_loadu_ps((const float*) ((uintptr_t) w + 16 * sizeof(float))); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x9__avx2_mul16_vpmovsx() local 239 vfpaccGHIJKLMN = _mm256_mul_ps(vfpaccGHIJKLMN, vscaleGHIJKLMN); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x9__avx2_mul16_vpmovsx()
|
D | up24x25-minmax-fp32-avx2-mul32.c | 477 const __m256 vscaleGHIJKLMN = _mm256_loadu_ps((const float*) w + 16); in xnn_qc8_dwconv_minmax_fp32_ukernel_up24x25__avx2_mul32() local 481 vscaledGHIJKLMN = _mm256_mul_ps(vscaledGHIJKLMN, vscaleGHIJKLMN); in xnn_qc8_dwconv_minmax_fp32_ukernel_up24x25__avx2_mul32()
|
D | up32x25-minmax-fp32-avx2-mul16-add16-vpunpck.c | 517 …const __m256 vscaleGHIJKLMN = _mm256_loadu_ps((const float*) ((uintptr_t) w + 16 * sizeof(float))); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck() local 522 vfpaccGHIJKLMN = _mm256_mul_ps(vfpaccGHIJKLMN, vscaleGHIJKLMN); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_add16_vpunpck()
|
D | up32x25-minmax-fp32-avx2-mul16-vpmovsx.c | 554 …const __m256 vscaleGHIJKLMN = _mm256_loadu_ps((const float*) ((uintptr_t) w + 16 * sizeof(float))); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx() local 559 vfpaccGHIJKLMN = _mm256_mul_ps(vfpaccGHIJKLMN, vscaleGHIJKLMN); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpmovsx()
|
D | up32x25-minmax-fp32-avx2-mul32.c | 554 const __m256 vscaleGHIJKLMN = _mm256_loadu_ps((const float*) w + 16); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul32() local 559 vscaledGHIJKLMN = _mm256_mul_ps(vscaledGHIJKLMN, vscaleGHIJKLMN); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul32()
|
D | up32x25-minmax-fp32-avx2-mul16-vpunpck.c | 589 …const __m256 vscaleGHIJKLMN = _mm256_loadu_ps((const float*) ((uintptr_t) w + 16 * sizeof(float))); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpunpck() local 594 vfpaccGHIJKLMN = _mm256_mul_ps(vfpaccGHIJKLMN, vscaleGHIJKLMN); in xnn_qc8_dwconv_minmax_fp32_ukernel_up32x25__avx2_mul16_vpunpck()
|