Searched refs:vyWXYZ (Results 1 – 8 of 8) sorted by relevance
/external/XNNPACK/src/qu8-f32-vcvt/gen/ |
D | vcvt-avx512skx-x48.c | 44 __m512 vyWXYZ = _mm512_cvtepi32_ps(vxWXYZ); in xnn_qu8_f32_vcvt_ukernel__avx512skx_x48() local 48 vyWXYZ = _mm512_mul_ps(vyWXYZ, vscale); in xnn_qu8_f32_vcvt_ukernel__avx512skx_x48() 52 _mm512_storeu_ps(y + 32, vyWXYZ); in xnn_qu8_f32_vcvt_ukernel__avx512skx_x48()
|
D | vcvt-avx512skx-x64.c | 46 __m512 vyWXYZ = _mm512_cvtepi32_ps(vxWXYZ); in xnn_qu8_f32_vcvt_ukernel__avx512skx_x64() local 51 vyWXYZ = _mm512_mul_ps(vyWXYZ, vscale); in xnn_qu8_f32_vcvt_ukernel__avx512skx_x64() 56 _mm512_storeu_ps(y + 32, vyWXYZ); in xnn_qu8_f32_vcvt_ukernel__avx512skx_x64()
|
/external/XNNPACK/src/qs8-f32-vcvt/gen/ |
D | vcvt-avx512skx-x48.c | 44 __m512 vyWXYZ = _mm512_cvtepi32_ps(vxWXYZ); in xnn_qs8_f32_vcvt_ukernel__avx512skx_x48() local 48 vyWXYZ = _mm512_mul_ps(vyWXYZ, vscale); in xnn_qs8_f32_vcvt_ukernel__avx512skx_x48() 52 _mm512_storeu_ps(y + 32, vyWXYZ); in xnn_qs8_f32_vcvt_ukernel__avx512skx_x48()
|
D | vcvt-avx512skx-x64.c | 46 __m512 vyWXYZ = _mm512_cvtepi32_ps(vxWXYZ); in xnn_qs8_f32_vcvt_ukernel__avx512skx_x64() local 51 vyWXYZ = _mm512_mul_ps(vyWXYZ, vscale); in xnn_qs8_f32_vcvt_ukernel__avx512skx_x64() 56 _mm512_storeu_ps(y + 32, vyWXYZ); in xnn_qs8_f32_vcvt_ukernel__avx512skx_x64()
|
/external/XNNPACK/src/f32-vsqrt/gen/ |
D | neonfma-nr1rsqrts1fma1adj-x36.c | 146 const float32x4_t vyWXYZ = vfmaq_f32(vsqrtxWXYZ, vhalfrsqrtxWXYZ, vadjustmentWXYZ); in xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x36() local 156 vst1q_f32(y, vyWXYZ); y += 4; in xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x36()
|
D | neonfma-nr2fma1adj-x36.c | 145 const float32x4_t vyWXYZ = vfmaq_f32(vsqrtxWXYZ, vhalfrsqrtxWXYZ, vadjustmentWXYZ); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x36() local 155 vst1q_f32(y, vyWXYZ); y += 4; in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x36()
|
D | neonfma-nr2fma1adj-x40.c | 156 const float32x4_t vyWXYZ = vfmaq_f32(vsqrtxWXYZ, vhalfrsqrtxWXYZ, vadjustmentWXYZ); in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x40() local 167 vst1q_f32(y, vyWXYZ); y += 4; in xnn_f32_vsqrt_ukernel__neonfma_nr2fma1adj_x40()
|
D | neonfma-nr1rsqrts1fma1adj-x40.c | 157 const float32x4_t vyWXYZ = vfmaq_f32(vsqrtxWXYZ, vhalfrsqrtxWXYZ, vadjustmentWXYZ); in xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x40() local 168 vst1q_f32(y, vyWXYZ); y += 4; in xnn_f32_vsqrt_ukernel__neonfma_nr1rsqrts1fma1adj_x40()
|