Home
last modified time | relevance | path

Searched defs:vresidual (Results 1 – 25 of 51) sorted by relevance

123

/external/XNNPACK/src/f32-vsqrt/
Dneonfma-nr2fma1adj.c.in68 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); variable
83 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); variable
Dneonfma-nr1rsqrts1fma1adj.c.in73 const float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); variable
88 const float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); variable
Davx512f-nr1fma1adj.c.in68 const __m512 vresidual = _mm512_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); variable
88 const __m512 vresidual = _mm512_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); variable
Dfma3-nr1fma1adj.c.in67 const __m256 vresidual = _mm256_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); variable
86 const __m256 vresidual = _mm256_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); variable
/external/XNNPACK/src/f32-vsqrt/gen/
Dneonfma-nr2fma1adj-x4.c34 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x4() local
49 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x4() local
Davx512f-nr1fma1adj-x16.c36 const __m512 vresidual = _mm512_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x16() local
56 const __m512 vresidual = _mm512_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x16() local
Dfma3-nr1fma1adj-x8.c35 const __m256 vresidual = _mm256_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x8() local
54 const __m256 vresidual = _mm256_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x8() local
Dneonfma-nr1rsqrts1fma1adj-x4.c37 const float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x4() local
52 const float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x4() local
Davx512f-nr1fma1adj-x32.c67 const __m512 vresidual = _mm512_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x32() local
87 const __m512 vresidual = _mm512_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x32() local
Dneonfma-nr2fma1adj-x8.c71 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x8() local
86 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x8() local
Dfma3-nr1fma1adj-x16.c66 const __m256 vresidual = _mm256_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x16() local
85 const __m256 vresidual = _mm256_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x16() local
Dneonfma-nr1rsqrts1fma1adj-x8.c75 const float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x8() local
90 const float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x8() local
Dfma3-nr1fma1adj-x24.c76 const __m256 vresidual = _mm256_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x24() local
95 const __m256 vresidual = _mm256_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x24() local
Dneonfma-nr2fma1adj-x12.c84 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x12() local
99 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x12() local
Davx512f-nr1fma1adj-x48.c77 const __m512 vresidual = _mm512_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x48() local
97 const __m512 vresidual = _mm512_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x48() local
Dneonfma-nr2fma1adj-x40.c82 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x40() local
175 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x40() local
190 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x40() local
Dneonfma-nr2fma1adj-x16.c97 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x16() local
112 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x16() local
Davx512f-nr1fma1adj-x64.c87 const __m512 vresidual = _mm512_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x64() local
107 const __m512 vresidual = _mm512_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x64() local
Dfma3-nr1fma1adj-x32.c86 const __m256 vresidual = _mm256_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x32() local
105 const __m256 vresidual = _mm256_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_f32_vsqrt_ukernel__fma3_nr1fma1adj_x32() local
Dneonfma-nr1rsqrts1fma1adj-x12.c88 const float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x12() local
103 const float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x12() local
/external/XNNPACK/src/math/
Dsqrt-avx512f-nr1fma.c35 const __m512 vresidual = _mm512_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_math_f32_sqrt__avx512f_nr1fma() local
Dsqrt-neonfma-nr3fma.c35 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_math_f32_sqrt__neonfma_nr3fma() local
Dsqrt-neonfma-nr2fma.c35 float32x4_t vresidual = vfmsq_f32(vhalf, vsqrtx, vhalfrsqrtx); in xnn_math_f32_sqrt__neonfma_nr2fma() local
Dsqrt-fma3-nr1fma.c35 const __m256 vresidual = _mm256_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_math_f32_sqrt__fma3_nr1fma() local
Dsqrt-fma3-nr2fma.c36 __m256 vresidual = _mm256_fnmadd_ps(vsqrtx, vhalfrsqrtx, vhalf); in xnn_math_f32_sqrt__fma3_nr2fma() local

123