Home
last modified time | relevance | path

Searched refs:vdenorm4 (Results 1 – 21 of 21) sorted by relevance

/external/XNNPACK/src/f16-f32-vcvt/gen/
Dvcvt-wasmsimd-int16-x24.c69 …const v128_t vdenorm4 = wasm_f32x4_sub(wasm_v16x8_shuffle(vnonsign2, vmagic_mask, 0, 8, 1, 9, 2,… in xnn_f16_f32_vcvt_ukernel__wasmsimd_int16_x24() local
93 wasm_v128_bitselect(vnorm4, vdenorm4, vxmask4)); in xnn_f16_f32_vcvt_ukernel__wasmsimd_int16_x24()
Dvcvt-sse41-int16-x24.c69 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_unpacklo_epi16(vnonsign2… in xnn_f16_f32_vcvt_ukernel__sse41_int16_x24() local
85 _mm_blendv_epi8(vdenorm4, vnorm4, _mm_cvtepi16_epi32(vmask2))); in xnn_f16_f32_vcvt_ukernel__sse41_int16_x24()
Dvcvt-avx-int16-x24.c69 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_unpacklo_epi16(vnonsign2… in xnn_f16_f32_vcvt_ukernel__avx_int16_x24() local
85 _mm_blendv_epi8(vdenorm4, vnorm4, _mm_cvtepi16_epi32(vmask2))); in xnn_f16_f32_vcvt_ukernel__avx_int16_x24()
Dvcvt-wasmsimd-int32-x24.c75 …const v128_t vdenorm4 = wasm_f32x4_sub(wasm_v128_or(wasm_u32x4_shr(vnonsign4, 16), vmagic_bias), v… in xnn_f16_f32_vcvt_ukernel__wasmsimd_int32_x24() local
89 const v128_t vf4 = wasm_v128_or(vsign4, wasm_v128_bitselect(vnorm4, vdenorm4, vxmask4)); in xnn_f16_f32_vcvt_ukernel__wasmsimd_int32_x24()
Dvcvt-sse2-int16-x24.c69 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_unpacklo_epi16(vnonsign2… in xnn_f16_f32_vcvt_ukernel__sse2_int16_x24() local
90 _mm_or_si128(_mm_and_si128(vxmask4, vnorm4), _mm_andnot_si128(vxmask4, vdenorm4))); in xnn_f16_f32_vcvt_ukernel__sse2_int16_x24()
Dvcvt-neon-int16-x24.c64 …const float32x4_t vdenorm4 = vsubq_f32(vreinterpretq_f32_u32(vaddw_u16(vmagic_bias, vget_low_u16(v… in xnn_f16_f32_vcvt_ukernel__neon_int16_x24() local
79 vreinterpretq_u32_f32(vbslq_f32(vxmask4, vnorm4, vdenorm4))); in xnn_f16_f32_vcvt_ukernel__neon_int16_x24()
Dvcvt-sse41-int32-x24.c74 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_or_si128(_mm_srli_epi32(… in xnn_f16_f32_vcvt_ukernel__sse41_int32_x24() local
88 const __m128i vf4 = _mm_or_si128(vsign4, _mm_blendv_epi8(vdenorm4, vnorm4, vmask4)); in xnn_f16_f32_vcvt_ukernel__sse41_int32_x24()
Dvcvt-neon-int32-x24.c73 …const float32x4_t vdenorm4 = vsubq_f32(vreinterpretq_f32_u32(vsriq_n_u32(vmagic_bias, vnonsign4, 1… in xnn_f16_f32_vcvt_ukernel__neon_int32_x24() local
87 …st uint32x4_t vf4 = vorrq_u32(vsign4, vreinterpretq_u32_f32(vbslq_f32(vxmask4, vnorm4, vdenorm4))); in xnn_f16_f32_vcvt_ukernel__neon_int32_x24()
Dvcvt-wasmsimd-int16-x32.c76 …const v128_t vdenorm4 = wasm_f32x4_sub(wasm_v16x8_shuffle(vnonsign2, vmagic_mask, 0, 8, 1, 9, 2,… in xnn_f16_f32_vcvt_ukernel__wasmsimd_int16_x32() local
105 wasm_v128_bitselect(vnorm4, vdenorm4, vxmask4)); in xnn_f16_f32_vcvt_ukernel__wasmsimd_int16_x32()
Dvcvt-avx-int32-x24.c74 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_or_si128(_mm_srli_epi32(… in xnn_f16_f32_vcvt_ukernel__avx_int32_x24() local
88 const __m128i vf4 = _mm_or_si128(vsign4, _mm_blendv_epi8(vdenorm4, vnorm4, vmask4)); in xnn_f16_f32_vcvt_ukernel__avx_int32_x24()
Dvcvt-sse41-int16-x32.c76 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_unpacklo_epi16(vnonsign2… in xnn_f16_f32_vcvt_ukernel__sse41_int16_x32() local
95 _mm_blendv_epi8(vdenorm4, vnorm4, _mm_cvtepi16_epi32(vmask2))); in xnn_f16_f32_vcvt_ukernel__sse41_int16_x32()
Dvcvt-avx-int16-x32.c76 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_unpacklo_epi16(vnonsign2… in xnn_f16_f32_vcvt_ukernel__avx_int16_x32() local
95 _mm_blendv_epi8(vdenorm4, vnorm4, _mm_cvtepi16_epi32(vmask2))); in xnn_f16_f32_vcvt_ukernel__avx_int16_x32()
Dvcvt-neon-int16-x32.c70 …const float32x4_t vdenorm4 = vsubq_f32(vreinterpretq_f32_u32(vaddw_u16(vmagic_bias, vget_low_u16(v… in xnn_f16_f32_vcvt_ukernel__neon_int16_x32() local
88 vreinterpretq_u32_f32(vbslq_f32(vxmask4, vnorm4, vdenorm4))); in xnn_f16_f32_vcvt_ukernel__neon_int16_x32()
Dvcvt-sse2-int32-x24.c74 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_or_si128(_mm_srli_epi32(… in xnn_f16_f32_vcvt_ukernel__sse2_int32_x24() local
93 _mm_or_si128(_mm_and_si128(vmask4, vnorm4), _mm_andnot_si128(vmask4, vdenorm4))); in xnn_f16_f32_vcvt_ukernel__sse2_int32_x24()
Dvcvt-neon-int32-x32.c82 …const float32x4_t vdenorm4 = vsubq_f32(vreinterpretq_f32_u32(vsriq_n_u32(vmagic_bias, vnonsign4, 1… in xnn_f16_f32_vcvt_ukernel__neon_int32_x32() local
100 …st uint32x4_t vf4 = vorrq_u32(vsign4, vreinterpretq_u32_f32(vbslq_f32(vxmask4, vnorm4, vdenorm4))); in xnn_f16_f32_vcvt_ukernel__neon_int32_x32()
Dvcvt-wasmsimd-int32-x32.c84 …const v128_t vdenorm4 = wasm_f32x4_sub(wasm_v128_or(wasm_u32x4_shr(vnonsign4, 16), vmagic_bias), v… in xnn_f16_f32_vcvt_ukernel__wasmsimd_int32_x32() local
102 const v128_t vf4 = wasm_v128_or(vsign4, wasm_v128_bitselect(vnorm4, vdenorm4, vxmask4)); in xnn_f16_f32_vcvt_ukernel__wasmsimd_int32_x32()
Dvcvt-avx-int32-x32.c83 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_or_si128(_mm_srli_epi32(… in xnn_f16_f32_vcvt_ukernel__avx_int32_x32() local
101 const __m128i vf4 = _mm_or_si128(vsign4, _mm_blendv_epi8(vdenorm4, vnorm4, vmask4)); in xnn_f16_f32_vcvt_ukernel__avx_int32_x32()
Dvcvt-sse2-int16-x32.c76 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_unpacklo_epi16(vnonsign2… in xnn_f16_f32_vcvt_ukernel__sse2_int16_x32() local
100 _mm_or_si128(_mm_and_si128(vxmask4, vnorm4), _mm_andnot_si128(vxmask4, vdenorm4))); in xnn_f16_f32_vcvt_ukernel__sse2_int16_x32()
Dvcvt-sse41-int32-x32.c83 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_or_si128(_mm_srli_epi32(… in xnn_f16_f32_vcvt_ukernel__sse41_int32_x32() local
101 const __m128i vf4 = _mm_or_si128(vsign4, _mm_blendv_epi8(vdenorm4, vnorm4, vmask4)); in xnn_f16_f32_vcvt_ukernel__sse41_int32_x32()
Dvcvt-sse2-int32-x32.c83 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_or_si128(_mm_srli_epi32(… in xnn_f16_f32_vcvt_ukernel__sse2_int32_x32() local
106 _mm_or_si128(_mm_and_si128(vmask4, vnorm4), _mm_andnot_si128(vmask4, vdenorm4))); in xnn_f16_f32_vcvt_ukernel__sse2_int32_x32()
/external/XNNPACK/src/amalgam/
Dsse2.c95 …const __m128i vdenorm4 = _mm_castps_si128(_mm_sub_ps(_mm_castsi128_ps(_mm_unpacklo_epi16(vnonsign2… in xnn_f16_f32_vcvt_ukernel__sse2_int16_x32() local
119 _mm_or_si128(_mm_and_si128(vxmask4, vnorm4), _mm_andnot_si128(vxmask4, vdenorm4))); in xnn_f16_f32_vcvt_ukernel__sse2_int16_x32()