Home
last modified time | relevance | path

Searched refs:vxyzw1 (Results 1 – 7 of 7) sorted by relevance

/external/XNNPACK/src/x8-zip/
Dxm-sse2.c50 __m128i vxyzw1 = _mm_unpackhi_epi16(vxy_lo, vzw_lo); in xnn_x8_zip_xm_ukernel__sse2() local
66 *((uint32_t*) output) = _mm_cvtsi128_si32(vxyzw1); in xnn_x8_zip_xm_ukernel__sse2()
68 vxyzw1 = _mm_shufflelo_epi16(vxyzw1, _MM_SHUFFLE(3, 2, 3, 2)); in xnn_x8_zip_xm_ukernel__sse2()
69 *((uint32_t*) output) = _mm_cvtsi128_si32(vxyzw1); in xnn_x8_zip_xm_ukernel__sse2()
71 vxyzw1 = _mm_unpackhi_epi64(vxyzw1, vxyzw1); in xnn_x8_zip_xm_ukernel__sse2()
72 *((uint32_t*) output) = _mm_cvtsi128_si32(vxyzw1); in xnn_x8_zip_xm_ukernel__sse2()
74 vxyzw1 = _mm_shufflelo_epi16(vxyzw1, _MM_SHUFFLE(3, 2, 3, 2)); in xnn_x8_zip_xm_ukernel__sse2()
75 *((uint32_t*) output) = _mm_cvtsi128_si32(vxyzw1); in xnn_x8_zip_xm_ukernel__sse2()
115 __m128i vxyzw1 = _mm_unpackhi_epi16(vxy, vzw); in xnn_x8_zip_xm_ukernel__sse2() local
129 *((uint32_t*) output) = _mm_cvtsi128_si32(vxyzw1); in xnn_x8_zip_xm_ukernel__sse2()
[all …]
Dx4-sse2.c40 const __m128i vxyzw1 = _mm_unpackhi_epi16(vxy_lo, vzw_lo); in xnn_x8_zip_x4_ukernel__sse2() local
44 _mm_storeu_si128((__m128i*) o + 1, vxyzw1); in xnn_x8_zip_x4_ukernel__sse2()
61 const __m128i vxyzw1 = _mm_unpackhi_epi16(vxy_lo, vzw_lo); in xnn_x8_zip_x4_ukernel__sse2() local
66 _mm_storeu_si128((__m128i*) o + 1, vxyzw1); in xnn_x8_zip_x4_ukernel__sse2()
Dxm-neon.c91 uint32x2_t vxyzw1 = vreinterpret_u32_u16(vxyzw_lo.val[1]); in xnn_x8_zip_xm_ukernel__neon() local
102 vst1_lane_u32(__builtin_assume_aligned(output, 1), vxyzw1, 0); in xnn_x8_zip_xm_ukernel__neon()
105 vst1_lane_u32(__builtin_assume_aligned(output, 1), vxyzw1, 1); in xnn_x8_zip_xm_ukernel__neon()
109 vxyzw1 = vxyzw3; in xnn_x8_zip_xm_ukernel__neon()
119 vxyzw0 = vxyzw1; in xnn_x8_zip_xm_ukernel__neon()
/external/XNNPACK/src/x32-zip/
Dx4-wasmsimd.c43 const v128_t vxyzw1 = wasm_v32x4_shuffle(vxy_lo, vzw_lo, 2, 3, 6, 7); in xnn_x32_zip_x4_ukernel__wasmsimd() local
48 wasm_v128_store(o + 4, vxyzw1); in xnn_x32_zip_x4_ukernel__wasmsimd()
Dx4-sse2.c43 const __m128i vxyzw1 = _mm_unpackhi_epi64(vxy_lo, vzw_lo); in xnn_x32_zip_x4_ukernel__sse2() local
48 _mm_storeu_si128((__m128i*) (o + 4), vxyzw1); in xnn_x32_zip_x4_ukernel__sse2()
Dxm-wasmsimd.c57 const v128_t vxyzw1 = wasm_v32x4_shuffle(vxy_lo, vzw_lo, 2, 3, 6, 7); in xnn_x32_zip_xm_ukernel__wasmsimd() local
64 wasm_v128_store(o, vxyzw1); in xnn_x32_zip_xm_ukernel__wasmsimd()
Dxm-sse2.c56 const __m128i vxyzw1 = _mm_unpackhi_epi64(vxy_lo, vzw_lo); in xnn_x32_zip_xm_ukernel__sse2() local
63 _mm_storeu_si128((__m128i*) output, vxyzw1); in xnn_x32_zip_xm_ukernel__sse2()