Searched refs:vhalfrsqrtx5 (Results 1 – 6 of 6) sorted by relevance
/external/XNNPACK/src/f32-vsqrt/gen/ |
D | avx512f-nr1fma1adj-x96.c | 56 __m512 vhalfrsqrtx5 = _mm512_mul_ps(vrsqrtx5, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96() local 63 const __m512 vresidual5 = _mm512_fnmadd_ps(vsqrtx5, vhalfrsqrtx5, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96() 75 vhalfrsqrtx5 = _mm512_fmadd_ps(vhalfrsqrtx5, vresidual5, vhalfrsqrtx5); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96() 90 const __m512 vy5 = _mm512_fmadd_ps(vhalfrsqrtx5, vadjustment5, vsqrtx5); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96()
|
D | fma3-nr1fma1adj-x48.c | 57 __m256 vhalfrsqrtx5 = _mm256_mul_ps(vrsqrtx5, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x48() local 64 const __m256 vresidual5 = _mm256_fnmadd_ps(vsqrtx5, vhalfrsqrtx5, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x48() 76 vhalfrsqrtx5 = _mm256_fmadd_ps(vhalfrsqrtx5, vresidual5, vhalfrsqrtx5); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x48() 91 const __m256 vy5 = _mm256_fmadd_ps(vhalfrsqrtx5, vadjustment5, vsqrtx5); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x48()
|
D | avx512f-nr1fma1adj-x112.c | 58 __m512 vhalfrsqrtx5 = _mm512_mul_ps(vrsqrtx5, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112() local 67 const __m512 vresidual5 = _mm512_fnmadd_ps(vsqrtx5, vhalfrsqrtx5, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112() 80 vhalfrsqrtx5 = _mm512_fmadd_ps(vhalfrsqrtx5, vresidual5, vhalfrsqrtx5); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112() 98 const __m512 vy5 = _mm512_fmadd_ps(vhalfrsqrtx5, vadjustment5, vsqrtx5); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112()
|
D | fma3-nr1fma1adj-x56.c | 59 __m256 vhalfrsqrtx5 = _mm256_mul_ps(vrsqrtx5, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x56() local 68 const __m256 vresidual5 = _mm256_fnmadd_ps(vsqrtx5, vhalfrsqrtx5, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x56() 81 vhalfrsqrtx5 = _mm256_fmadd_ps(vhalfrsqrtx5, vresidual5, vhalfrsqrtx5); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x56() 99 const __m256 vy5 = _mm256_fmadd_ps(vhalfrsqrtx5, vadjustment5, vsqrtx5); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x56()
|
D | avx512f-nr1fma1adj-x128.c | 60 __m512 vhalfrsqrtx5 = _mm512_mul_ps(vrsqrtx5, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128() local 71 const __m512 vresidual5 = _mm512_fnmadd_ps(vsqrtx5, vhalfrsqrtx5, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128() 85 vhalfrsqrtx5 = _mm512_fmadd_ps(vhalfrsqrtx5, vresidual5, vhalfrsqrtx5); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128() 106 const __m512 vy5 = _mm512_fmadd_ps(vhalfrsqrtx5, vadjustment5, vsqrtx5); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128()
|
D | fma3-nr1fma1adj-x64.c | 61 __m256 vhalfrsqrtx5 = _mm256_mul_ps(vrsqrtx5, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x64() local 72 const __m256 vresidual5 = _mm256_fnmadd_ps(vsqrtx5, vhalfrsqrtx5, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x64() 86 vhalfrsqrtx5 = _mm256_fmadd_ps(vhalfrsqrtx5, vresidual5, vhalfrsqrtx5); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x64() 107 const __m256 vy5 = _mm256_fmadd_ps(vhalfrsqrtx5, vadjustment5, vsqrtx5); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x64()
|