Searched refs:vacc89ABCDEFp1 (Results 1 – 6 of 6) sorted by relevance
/external/XNNPACK/src/f32-dwconv/gen/ |
D | up16x25-fma3-acc2.c | 110 __m256 vacc89ABCDEFp1 = _mm256_mul_ps(vi1x89ABCDEF, vk1x89ABCDEF); in xnn_f32_dwconv_ukernel_up16x25__fma3_acc2() local 128 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi3x89ABCDEF, vk3x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x25__fma3_acc2() 146 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi5x89ABCDEF, vk5x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x25__fma3_acc2() 164 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi7x89ABCDEF, vk7x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x25__fma3_acc2() 182 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi9x89ABCDEF, vk9x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x25__fma3_acc2() 200 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi11x89ABCDEF, vk11x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x25__fma3_acc2() 218 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi13x89ABCDEF, vk13x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x25__fma3_acc2() 236 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi15x89ABCDEF, vk15x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x25__fma3_acc2() 254 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi17x89ABCDEF, vk17x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x25__fma3_acc2() 272 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi19x89ABCDEF, vk19x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x25__fma3_acc2() [all …]
|
D | up16x25-avx-acc2.c | 110 __m256 vacc89ABCDEFp1 = _mm256_mul_ps(vi1x89ABCDEF, vk1x89ABCDEF); in xnn_f32_dwconv_ukernel_up16x25__avx_acc2() local 128 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi3x89ABCDEF, vk3x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x25__avx_acc2() 146 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi5x89ABCDEF, vk5x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x25__avx_acc2() 164 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi7x89ABCDEF, vk7x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x25__avx_acc2() 182 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi9x89ABCDEF, vk9x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x25__avx_acc2() 200 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi11x89ABCDEF, vk11x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x25__avx_acc2() 218 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi13x89ABCDEF, vk13x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x25__avx_acc2() 236 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi15x89ABCDEF, vk15x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x25__avx_acc2() 254 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi17x89ABCDEF, vk17x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x25__avx_acc2() 272 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi19x89ABCDEF, vk19x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x25__avx_acc2() [all …]
|
D | up16x9-fma3-acc2.c | 78 __m256 vacc89ABCDEFp1 = _mm256_mul_ps(vi1x89ABCDEF, vk1x89ABCDEF); in xnn_f32_dwconv_ukernel_up16x9__fma3_acc2() local 96 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi3x89ABCDEF, vk3x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x9__fma3_acc2() 114 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi5x89ABCDEF, vk5x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x9__fma3_acc2() 132 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi7x89ABCDEF, vk7x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x9__fma3_acc2() 147 vacc89ABCDEFp0 = _mm256_add_ps(vacc89ABCDEFp0, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x9__fma3_acc2()
|
D | up16x9-avx-acc2.c | 78 __m256 vacc89ABCDEFp1 = _mm256_mul_ps(vi1x89ABCDEF, vk1x89ABCDEF); in xnn_f32_dwconv_ukernel_up16x9__avx_acc2() local 96 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi3x89ABCDEF, vk3x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x9__avx_acc2() 114 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi5x89ABCDEF, vk5x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x9__avx_acc2() 132 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi7x89ABCDEF, vk7x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x9__avx_acc2() 147 vacc89ABCDEFp0 = _mm256_add_ps(vacc89ABCDEFp0, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x9__avx_acc2()
|
D | up16x4-avx-acc2.c | 68 __m256 vacc89ABCDEFp1 = _mm256_mul_ps(vi1x89ABCDEF, vk1x89ABCDEF); in xnn_f32_dwconv_ukernel_up16x4__avx_acc2() local 86 vacc89ABCDEFp1 = _mm256_add_ps(vacc89ABCDEFp1, _mm256_mul_ps(vi3x89ABCDEF, vk3x89ABCDEF)); in xnn_f32_dwconv_ukernel_up16x4__avx_acc2() 92 vacc89ABCDEFp0 = _mm256_add_ps(vacc89ABCDEFp0, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x4__avx_acc2()
|
D | up16x4-fma3-acc2.c | 68 __m256 vacc89ABCDEFp1 = _mm256_mul_ps(vi1x89ABCDEF, vk1x89ABCDEF); in xnn_f32_dwconv_ukernel_up16x4__fma3_acc2() local 86 vacc89ABCDEFp1 = _mm256_fmadd_ps(vi3x89ABCDEF, vk3x89ABCDEF, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x4__fma3_acc2() 92 vacc89ABCDEFp0 = _mm256_add_ps(vacc89ABCDEFp0, vacc89ABCDEFp1); in xnn_f32_dwconv_ukernel_up16x4__fma3_acc2()
|