Home
last modified time | relevance | path

Searched refs:_mm_unpacklo_epi64 (Results 1 – 25 of 133) sorted by relevance

123456

/external/python/cpython3/Modules/_blake2/impl/
Dblake2b-load-sse41.h20 b0 = _mm_unpacklo_epi64(m0, m1); \
21 b1 = _mm_unpacklo_epi64(m2, m3); \
36 b0 = _mm_unpacklo_epi64(m4, m5); \
37 b1 = _mm_unpacklo_epi64(m6, m7); \
52 b0 = _mm_unpacklo_epi64(m7, m2); \
60 b0 = _mm_unpacklo_epi64(m5, m4); \
76 b0 = _mm_unpacklo_epi64(m6, m1); \
92 b0 = _mm_unpacklo_epi64(m4, m0); \
108 b0 = _mm_unpacklo_epi64(m7, m3); \
125 b1 = _mm_unpacklo_epi64(m6, m7); \
[all …]
Dblake2b-round.h123 row4l = _mm_unpackhi_epi64(row4h, _mm_unpacklo_epi64(t0, t0)); \
124 row4h = _mm_unpackhi_epi64(t0, _mm_unpacklo_epi64(row4h, row4h)); \
125 row2l = _mm_unpackhi_epi64(row2l, _mm_unpacklo_epi64(row2h, row2h)); \
126 row2h = _mm_unpackhi_epi64(row2h, _mm_unpacklo_epi64(t1, t1))
134 row2l = _mm_unpackhi_epi64(row2h, _mm_unpacklo_epi64(row2l, row2l)); \
135 row2h = _mm_unpackhi_epi64(t0, _mm_unpacklo_epi64(row2h, row2h)); \
136 row4l = _mm_unpackhi_epi64(row4l, _mm_unpacklo_epi64(row4h, row4h)); \
137 row4h = _mm_unpackhi_epi64(row4h, _mm_unpacklo_epi64(t1, t1))
Dblake2s-load-sse41.h97 buf = _mm_unpacklo_epi64(t1,t0);
100 t0 = _mm_unpacklo_epi64(m1,m2); \
107 t1 = _mm_unpacklo_epi64(m0,m1); \
124 buf = _mm_unpacklo_epi64(t0,t1);
138 t0 = _mm_unpacklo_epi64(m1,m2); \
154 t0 = _mm_unpacklo_epi64(m0,m2); \
176 t1 = _mm_unpacklo_epi64(m1,m2); \
183 buf = _mm_unpacklo_epi64(t0,t1);
187 t1 = _mm_unpacklo_epi64(t0,m0); \
/external/libaom/libaom/aom_dsp/x86/
Dtranspose_sse2.h86 out[0] = _mm_unpacklo_epi64(c0, c0); in transpose_8bit_8x8()
88 out[2] = _mm_unpacklo_epi64(c1, c1); in transpose_8bit_8x8()
90 out[4] = _mm_unpacklo_epi64(c2, c2); in transpose_8bit_8x8()
92 out[6] = _mm_unpacklo_epi64(c3, c3); in transpose_8bit_8x8()
156 out[0] = _mm_unpacklo_epi64(b0, b1); in transpose_16bit_4x8()
158 out[2] = _mm_unpacklo_epi64(b2, b3); in transpose_16bit_4x8()
200 out[0] = _mm_unpacklo_epi64(b0, zeros); in transpose_16bit_8x4()
202 out[2] = _mm_unpacklo_epi64(b4, zeros); in transpose_16bit_8x4()
204 out[4] = _mm_unpacklo_epi64(b2, zeros); in transpose_16bit_8x4()
206 out[6] = _mm_unpacklo_epi64(b6, zeros); in transpose_16bit_8x4()
[all …]
Dlpf_common_sse2.h39 *d0 = _mm_unpacklo_epi64(ww0, w2); // 00 10 20 30 40 50 41 51 in highbd_transpose6x6_sse2()
44 *d2 = _mm_unpacklo_epi64(ww0, in highbd_transpose6x6_sse2()
54 *d4 = _mm_unpacklo_epi64(ww0, w5); // 04 14 24 34 44 54 45 55 in highbd_transpose6x6_sse2()
72 *d0 = _mm_unpacklo_epi64(ww0, zero); // 00 10 20 30 xx xx xx xx in highbd_transpose4x8_8x4_low_sse2()
74 *d2 = _mm_unpacklo_epi64(ww1, zero); // 02 12 22 32 xx xx xx xx in highbd_transpose4x8_8x4_low_sse2()
91 *d4 = _mm_unpacklo_epi64(ww2, zero); // 04 14 24 34 xx xx xx xx in highbd_transpose4x8_8x4_high_sse2()
93 *d6 = _mm_unpacklo_epi64(ww3, zero); // 06 16 26 36 xx xx xx xx in highbd_transpose4x8_8x4_high_sse2()
147 *d0 = _mm_unpacklo_epi64(ww0, ww1); // 00 10 20 30 40 50 60 70 in highbd_transpose8x8_low_sse2()
153 *d2 = _mm_unpacklo_epi64(ww0, ww1); // 02 12 22 32 42 52 62 72 in highbd_transpose8x8_low_sse2()
180 *d4 = _mm_unpacklo_epi64(ww0, ww1); // 04 14 24 34 44 54 64 74 in highbd_transpose8x8_high_sse2()
[all …]
Dloopfilter_sse2.c135 *pq0 = _mm_unpacklo_epi64(d0, d1); // pq in transpose_pq_14_inv_sse2()
137 *pq2 = _mm_unpacklo_epi64(d2, d3); // pq in transpose_pq_14_inv_sse2()
215 filter = _mm_unpacklo_epi64(filter, filter); in filter4_dual_sse2()
234 filter2filter1 = _mm_unpacklo_epi64(filter2filter1, filter); in filter4_dual_sse2()
295 q1p1 = _mm_unpacklo_epi64(*p1, *q1); in lpf_internal_4_dual_sse2()
296 q0p0 = _mm_unpacklo_epi64(*p0, *q0); in lpf_internal_4_dual_sse2()
298 p1p0 = _mm_unpacklo_epi64(q0p0, q1p1); in lpf_internal_4_dual_sse2()
321 mask = _mm_unpacklo_epi64(mask, flat); in lpf_internal_4_dual_sse2()
405 p1p0 = _mm_unpacklo_epi64(*q0p0, *q1p1); in lpf_internal_14_dual_sse2()
417 abs_p0q0 = _mm_unpacklo_epi64(abs_p0q0, zero); in lpf_internal_14_dual_sse2()
[all …]
Dhighbd_loopfilter_sse2.c58 x0 = _mm_unpacklo_epi64(x0, x1); in get_limit_dual()
63 x0 = _mm_unpacklo_epi64(x0, x1); in get_limit_dual()
68 x0 = _mm_unpacklo_epi64(x0, x1); in get_limit_dual()
119 *p1p0 = _mm_unpacklo_epi64(pq[0], pq[1]); in highbd_hev_filter_mask_x_sse2()
124 abs_p0q0 = _mm_unpacklo_epi64(abs_p0q0, zero); in highbd_hev_filter_mask_x_sse2()
144 *hev = _mm_unpacklo_epi64(*hev, *hev); in highbd_hev_filter_mask_x_sse2()
241 filt = _mm_unpacklo_epi64(filt, filt); in highbd_filter4_sse2()
247 filt = _mm_unpacklo_epi64(filter2filter1, filter2filter1); in highbd_filter4_sse2()
255 filter1filt = _mm_unpacklo_epi64(filter2filter1, filt); in highbd_filter4_sse2()
336 pq[i] = _mm_unpacklo_epi64(p[i], q[i]); in highbd_lpf_internal_14_sse2()
[all …]
Dsse_avx2.c79 const __m128i v_a0123 = _mm_unpacklo_epi64(_mm_unpacklo_epi32(v_a0, v_a1), in sse_w4x4_avx2()
81 const __m128i v_b0123 = _mm_unpacklo_epi64(_mm_unpacklo_epi32(v_b0, v_b1), in sse_w4x4_avx2()
94 const __m256i v_a_w = _mm256_cvtepu8_epi16(_mm_unpacklo_epi64(v_a0, v_a1)); in sse_w8x2_avx2()
95 const __m256i v_b_w = _mm256_cvtepu8_epi16(_mm_unpacklo_epi64(v_b0, v_b1)); in sse_w8x2_avx2()
236 const __m256i v_a_w = yy_set_m128i(_mm_unpacklo_epi64(v_a0, v_a1), in highbd_sse_w4x4_avx2()
237 _mm_unpacklo_epi64(v_a2, v_a3)); in highbd_sse_w4x4_avx2()
238 const __m256i v_b_w = yy_set_m128i(_mm_unpacklo_epi64(v_b0, v_b1), in highbd_sse_w4x4_avx2()
239 _mm_unpacklo_epi64(v_b2, v_b3)); in highbd_sse_w4x4_avx2()
Dhighbd_convolve_sse2.c43 thirdFilters = _mm_unpacklo_epi64(tmp1, tmp1); // coeffs 4 5 4 5 4 5 4 5 in aom_highbd_filter_block1d4_v4_sse2()
125 thirdFilters = _mm_unpacklo_epi64(tmp_1, tmp_1); // coeffs 4 5 4 5 4 5 4 5 in aom_highbd_filter_block1d4_h4_sse2()
182 thirdFilters = _mm_unpacklo_epi64(tmp1, tmp1); // coeffs 4 5 4 5 4 5 4 5 in aom_highbd_filter_block1d8_v4_sse2()
286 thirdFilters = _mm_unpacklo_epi64(tmp_1, tmp_1); // coeffs 4 5 4 5 4 5 4 5 in aom_highbd_filter_block1d8_h4_sse2()
294 __m128i ss_4 = _mm_unpacklo_epi64(ss_4_1, ss_4_2); in aom_highbd_filter_block1d8_h4_sse2()
304 __m128i ss_3 = _mm_unpacklo_epi64(ss_3_1, ss_3_2); in aom_highbd_filter_block1d8_h4_sse2()
305 __m128i ss_5 = _mm_unpacklo_epi64(ss_5_1, ss_5_2); in aom_highbd_filter_block1d8_h4_sse2()
/external/libvpx/libvpx/vpx_dsp/x86/
Dtranspose_sse2.h85 out[0] = _mm_unpacklo_epi64(c0, c0); in transpose_8bit_8x8()
87 out[2] = _mm_unpacklo_epi64(c1, c1); in transpose_8bit_8x8()
89 out[4] = _mm_unpacklo_epi64(c2, c2); in transpose_8bit_8x8()
91 out[6] = _mm_unpacklo_epi64(c3, c3); in transpose_8bit_8x8()
151 out[0] = _mm_unpacklo_epi64(b0, b1); in transpose_16bit_4x8()
153 out[2] = _mm_unpacklo_epi64(b2, b3); in transpose_16bit_4x8()
213 out[0] = _mm_unpacklo_epi64(b0, b1); in transpose_16bit_8x8()
215 out[2] = _mm_unpacklo_epi64(b4, b5); in transpose_16bit_8x8()
217 out[4] = _mm_unpacklo_epi64(b2, b3); in transpose_16bit_8x8()
219 out[6] = _mm_unpacklo_epi64(b6, b7); in transpose_16bit_8x8()
[all …]
/external/libgav1/libgav1/src/dsp/x86/
Dtranspose_sse4.h149 out[0] = _mm_unpacklo_epi64(b0, b1); in Transpose4x8To8x4_U16()
151 out[2] = _mm_unpacklo_epi64(b2, b3); in Transpose4x8To8x4_U16()
193 out[0] = _mm_unpacklo_epi64(b0, zeros); in Transpose8x4To4x8_U16()
195 out[2] = _mm_unpacklo_epi64(b4, zeros); in Transpose8x4To4x8_U16()
197 out[4] = _mm_unpacklo_epi64(b2, zeros); in Transpose8x4To4x8_U16()
199 out[6] = _mm_unpacklo_epi64(b6, zeros); in Transpose8x4To4x8_U16()
259 out[0] = _mm_unpacklo_epi64(b0, b1); in Transpose8x8_U16()
261 out[2] = _mm_unpacklo_epi64(b4, b5); in Transpose8x8_U16()
263 out[4] = _mm_unpacklo_epi64(b2, b3); in Transpose8x8_U16()
265 out[6] = _mm_unpacklo_epi64(b6, b7); in Transpose8x8_U16()
Dloop_filter_sse4.cc110 const __m128i qp1qp0 = _mm_unpacklo_epi64(qp0, qp1); in Filter4()
132 const __m128i a3a3a1a2 = _mm_unpacklo_epi64(a1a2, a3a3); in Filter4()
1004 *x0 = _mm_unpacklo_epi64(d0, d1); in DualTranspose4x8To8x4()
1008 *x2 = _mm_unpacklo_epi64(d2, d3); in DualTranspose4x8To8x4()
1036 const __m128i qp1qp0 = _mm_unpacklo_epi64(qp0, qp1); in Vertical14()
1258 __m128i oqps1 = _mm_unpacklo_epi64(ops1, oqs1); in Filter4()
1259 __m128i oqps0 = _mm_unpacklo_epi64(ops0, oqs0); in Filter4()
1287 const __m128i p1p0 = _mm_unpacklo_epi64(qp0, qp1); in Horizontal4()
1329 const __m128i qp0 = _mm_unpacklo_epi64(p1p0, q1q0); in Vertical4()
1360 const __m128i p1p0 = _mm_unpacklo_epi64(qp0, qp1); in CheckOuterThreshF6()
[all …]
/external/libavc/common/x86/
Dih264_resi_trans_quant_sse42.c170 src_r0 = _mm_unpacklo_epi64(temp1, zero_8x16b); //a0 b0 c0 d0 in ih264_resi_trans_quant_4x4_sse42()
172 src_r2 = _mm_unpacklo_epi64(temp3, zero_8x16b); //a2 b2 c2 d2 in ih264_resi_trans_quant_4x4_sse42()
208 src_r0 = _mm_unpacklo_epi64(temp1, zero_8x16b); //a0 a1 a2 a3 in ih264_resi_trans_quant_4x4_sse42()
210 src_r2 = _mm_unpacklo_epi64(temp3, zero_8x16b); //c0 c1 c2 c3 in ih264_resi_trans_quant_4x4_sse42()
237 src_r0 = _mm_unpacklo_epi64(src_r0, src_r1); //a0 a1 a2 a3 b0 b1 b2 b3 in ih264_resi_trans_quant_4x4_sse42()
238 src_r2 = _mm_unpacklo_epi64(src_r2, src_r3); //c0 c1 c2 c3 d0 d1 d2 d3 in ih264_resi_trans_quant_4x4_sse42()
453 src_r0 = _mm_unpacklo_epi64(temp1, zero_8x16b); //a0 b0 c0 d0 in ih264_resi_trans_quant_chroma_4x4_sse42()
455 src_r2 = _mm_unpacklo_epi64(temp3, zero_8x16b); //a2 b2 c2 d2 in ih264_resi_trans_quant_chroma_4x4_sse42()
491 src_r0 = _mm_unpacklo_epi64(temp1, zero_8x16b); //a0 a1 a2 a3 in ih264_resi_trans_quant_chroma_4x4_sse42()
493 src_r2 = _mm_unpacklo_epi64(temp3, zero_8x16b); //c0 c1 c2 c3 in ih264_resi_trans_quant_chroma_4x4_sse42()
[all …]
Dih264_ihadamard_scaling_sse42.c129 src_r0 = _mm_unpacklo_epi64(temp0, temp2); //a0 b0 c0 d0 in ih264_ihadamard_scaling_4x4_sse42()
131 src_r2 = _mm_unpacklo_epi64(temp1, temp3); //a2 b2 c2 d2 in ih264_ihadamard_scaling_4x4_sse42()
158 src_r0 = _mm_unpacklo_epi64(temp0, temp2); //a0 a1 a2 a3 in ih264_ihadamard_scaling_4x4_sse42()
160 src_r2 = _mm_unpacklo_epi64(temp1, temp3); //c0 c1 c2 c3 in ih264_ihadamard_scaling_4x4_sse42()
228 …plane_0 = _mm_unpacklo_epi64(temp0, temp1); //a0+a1+a2+a3 a0+a1-a2-a3 a0-a1+a2-a3 a0-a1-a2… in ih264_ihadamard_scaling_2x2_uv_sse42()
Dih264_ihadamard_scaling_ssse3.c131 src_r0 = _mm_unpacklo_epi64(temp0, temp2); //a0 b0 c0 d0 in ih264_ihadamard_scaling_4x4_ssse3()
133 src_r2 = _mm_unpacklo_epi64(temp1, temp3); //a2 b2 c2 d2 in ih264_ihadamard_scaling_4x4_ssse3()
160 src_r0 = _mm_unpacklo_epi64(temp0, temp2); //a0 a1 a2 a3 in ih264_ihadamard_scaling_4x4_ssse3()
162 src_r2 = _mm_unpacklo_epi64(temp1, temp3); //c0 c1 c2 c3 in ih264_ihadamard_scaling_4x4_ssse3()
/external/libhevc/common/x86/
Dihevc_itrans_recon_32x32_ssse3_intr.c1844 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
1874 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
1904 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
1933 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
1962 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
1992 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
2021 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
2051 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
2080 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
2108 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
[all …]
Dihevc_32x32_itrans_recon_sse42_intr.c1833 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
1863 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
1893 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
1922 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
1951 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
1981 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
2010 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
2040 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
2069 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
2097 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
[all …]
Dihevc_deblk_ssse3_intr.c150 src_tmp_8x16b = _mm_unpacklo_epi64(src_row0_8x16b, src_row3_8x16b); in ihevc_deblk_luma_vert_ssse3()
260 src_row0_8x16b = _mm_unpacklo_epi64(src_row0_8x16b, src_row2_8x16b); in ihevc_deblk_luma_vert_ssse3()
261 src_row1_8x16b = _mm_unpacklo_epi64(src_row1_8x16b, src_row3_8x16b); in ihevc_deblk_luma_vert_ssse3()
365 src_row0_8x16b = _mm_unpacklo_epi64(temp_pq_str1_16x8b, temp_str0_16x8b); in ihevc_deblk_luma_vert_ssse3()
367 src_row2_8x16b = _mm_unpacklo_epi64(temp_str2_16x8b, temp_pq_str0_16x8b); in ihevc_deblk_luma_vert_ssse3()
398 src_row0_8x16b = _mm_unpacklo_epi64(src_row0_8x16b, src_row1_8x16b); in ihevc_deblk_luma_vert_ssse3()
399 src_row2_8x16b = _mm_unpacklo_epi64(src_row2_8x16b, src_row3_8x16b); in ihevc_deblk_luma_vert_ssse3()
407 tmp_delta2_8x16b = _mm_unpacklo_epi64(tmp_delta2_8x16b, tmp_delta3_8x16b); in ihevc_deblk_luma_vert_ssse3()
437 mask_pq_8x16b = _mm_unpacklo_epi64(mask_pq_8x16b, mask_pq_8x16b); in ihevc_deblk_luma_vert_ssse3()
720 temp_pq0_str0_16x8b = _mm_unpacklo_epi64(temp_pq0_str0_16x8b, temp_str0_16x8b); in ihevc_deblk_luma_horz_ssse3()
[all …]
Dihevc_itrans_recon_sse42_intr.c220 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_4x4_ttype1_sse42()
311 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_4x4_ttype1_sse42()
360 m_temp_reg_0 = _mm_unpacklo_epi64(m_temp_reg_0, m_temp_reg_1); in ihevc_itrans_recon_4x4_ttype1_sse42()
361 m_temp_reg_1 = _mm_unpacklo_epi64(m_temp_reg_2, m_temp_reg_3); in ihevc_itrans_recon_4x4_ttype1_sse42()
530 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_4x4_sse42()
624 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_4x4_sse42()
685 m_temp_reg_0 = _mm_unpacklo_epi64(m_temp_reg_0, m_temp_reg_1); in ihevc_itrans_recon_4x4_sse42()
688 m_temp_reg_1 = _mm_unpacklo_epi64(m_temp_reg_2, m_temp_reg_3); in ihevc_itrans_recon_4x4_sse42()
1072 m_temp_reg_50 = _mm_unpacklo_epi64(m_temp_reg_0, m_temp_reg_4); in ihevc_itrans_recon_8x8_sse42()
1074 m_temp_reg_52 = _mm_unpacklo_epi64(m_temp_reg_1, m_temp_reg_5); in ihevc_itrans_recon_8x8_sse42()
[all …]
/external/libaom/libaom/aom_dsp/simd/
Dv64_intrinsics_x86.h95 ((c) ? _mm_srli_si128(_mm_unpacklo_epi64(b, a), (c)) : b)
172 __m128i t = _mm_unpacklo_epi64(b, a); in v64_pack_s32_s16()
178 __m128i t = _mm_unpacklo_epi64(b, a); in v64_pack_s32_u16()
193 __m128i t = _mm_unpacklo_epi64(b, a); in v64_pack_s16_u8()
198 __m128i t = _mm_unpacklo_epi64(b, a); in v64_pack_s16_s8()
204 return _mm_shuffle_epi8(_mm_unpacklo_epi64(b, a), in v64_unziphi_8()
208 _mm_unpacklo_epi64(_mm_srli_epi16(b, 8), _mm_srli_epi16(a, 8)), in v64_unziphi_8()
215 return _mm_shuffle_epi8(_mm_unpacklo_epi64(b, a), in v64_unziplo_8()
224 return _mm_shuffle_epi8(_mm_unpacklo_epi64(b, a), in v64_unziphi_16()
228 _mm_unpacklo_epi64(_mm_srai_epi32(b, 16), _mm_srai_epi32(a, 16)), in v64_unziphi_16()
[all …]
/external/libhevc/decoder/x86/
Dihevcd_fmt_conv_ssse3_intr.c153 src_u_8x16b = _mm_unpacklo_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
166 src_u_8x16b = _mm_unpacklo_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
179 src_u_8x16b = _mm_unpacklo_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
192 src_u_8x16b = _mm_unpacklo_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
228 src_u_8x16b = _mm_unpacklo_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
/external/webp/src/dsp/
Dcommon_sse2.h93 *out0 = _mm_unpacklo_epi64(transpose1_0, transpose1_1); in VP8Transpose_2_4x4_16b()
95 *out2 = _mm_unpacklo_epi64(transpose1_2, transpose1_3); in VP8Transpose_2_4x4_16b()
183 *in1 = _mm_unpacklo_epi64(C1, C3); in VP8L32bToPlanar_SSE2()
185 *in3 = _mm_unpacklo_epi64(C0, C2); in VP8L32bToPlanar_SSE2()
/external/XNNPACK/src/x32-zip/
Dx4-sse2.c42 const __m128i vxyzw0 = _mm_unpacklo_epi64(vxy_lo, vzw_lo); in xnn_x32_zip_x4_ukernel__sse2()
44 const __m128i vxyzw2 = _mm_unpacklo_epi64(vxy_hi, vzw_hi); in xnn_x32_zip_x4_ukernel__sse2()
68 const __m128i vxyzw_lo = _mm_unpacklo_epi64(vxy, vzw); in xnn_x32_zip_x4_ukernel__sse2()
/external/libaom/libaom/av1/common/x86/
Dreconinter_avx2.c45 const __m128i s0ABCD = _mm_unpacklo_epi64(s0AB, s0CD); in av1_build_compound_diffwtd_mask_avx2()
54 const __m128i s1ABCD = _mm_unpacklo_epi64(s1AB, s1CD); in av1_build_compound_diffwtd_mask_avx2()
72 const __m256i s0AC_w = _mm256_cvtepu8_epi16(_mm_unpacklo_epi64(s0A, s0C)); in av1_build_compound_diffwtd_mask_avx2()
73 const __m256i s0BD_w = _mm256_cvtepu8_epi16(_mm_unpacklo_epi64(s0B, s0D)); in av1_build_compound_diffwtd_mask_avx2()
78 const __m256i s1AB_w = _mm256_cvtepu8_epi16(_mm_unpacklo_epi64(s1A, s1C)); in av1_build_compound_diffwtd_mask_avx2()
79 const __m256i s1CD_w = _mm256_cvtepu8_epi16(_mm_unpacklo_epi64(s1B, s1D)); in av1_build_compound_diffwtd_mask_avx2()
190 const __m256i s0 = yy_set_m128i(_mm_unpacklo_epi64(s0C, s0D), in build_compound_diffwtd_mask_d16_avx2()
191 _mm_unpacklo_epi64(s0A, s0B)); in build_compound_diffwtd_mask_d16_avx2()
192 const __m256i s1 = yy_set_m128i(_mm_unpacklo_epi64(s1C, s1D), in build_compound_diffwtd_mask_d16_avx2()
193 _mm_unpacklo_epi64(s1A, s1B)); in build_compound_diffwtd_mask_d16_avx2()
[all …]
/external/mesa3d/src/gallium/auxiliary/util/
Du_sse.h263 *o = _mm_unpacklo_epi64(t0, t1); in transpose4_epi32()
265 *q = _mm_unpacklo_epi64(t2, t3); in transpose4_epi32()
289 *o = _mm_unpacklo_epi64(t0, t1); in transpose2_64_2_32()
291 *q = _mm_unpacklo_epi64(t2, t3); in transpose2_64_2_32()

123456