Home
last modified time | relevance | path

Searched refs:_mm_unpacklo_epi64 (Results 1 – 25 of 120) sorted by relevance

12345

/external/python/cpython3/Modules/_blake2/impl/
Dblake2b-load-sse41.h22 b0 = _mm_unpacklo_epi64(m0, m1); \
23 b1 = _mm_unpacklo_epi64(m2, m3); \
38 b0 = _mm_unpacklo_epi64(m4, m5); \
39 b1 = _mm_unpacklo_epi64(m6, m7); \
54 b0 = _mm_unpacklo_epi64(m7, m2); \
62 b0 = _mm_unpacklo_epi64(m5, m4); \
78 b0 = _mm_unpacklo_epi64(m6, m1); \
94 b0 = _mm_unpacklo_epi64(m4, m0); \
110 b0 = _mm_unpacklo_epi64(m7, m3); \
127 b1 = _mm_unpacklo_epi64(m6, m7); \
[all …]
Dblake2b-round.h122 row4l = _mm_unpackhi_epi64(row4h, _mm_unpacklo_epi64(t0, t0)); \
123 row4h = _mm_unpackhi_epi64(t0, _mm_unpacklo_epi64(row4h, row4h)); \
124 row2l = _mm_unpackhi_epi64(row2l, _mm_unpacklo_epi64(row2h, row2h)); \
125 row2h = _mm_unpackhi_epi64(row2h, _mm_unpacklo_epi64(t1, t1))
133 row2l = _mm_unpackhi_epi64(row2h, _mm_unpacklo_epi64(row2l, row2l)); \
134 row2h = _mm_unpackhi_epi64(t0, _mm_unpacklo_epi64(row2h, row2h)); \
135 row4l = _mm_unpackhi_epi64(row4l, _mm_unpacklo_epi64(row4h, row4h)); \
136 row4h = _mm_unpackhi_epi64(row4h, _mm_unpacklo_epi64(t1, t1))
Dblake2s-load-sse41.h99 buf = _mm_unpacklo_epi64(t1,t0);
102 t0 = _mm_unpacklo_epi64(m1,m2); \
109 t1 = _mm_unpacklo_epi64(m0,m1); \
126 buf = _mm_unpacklo_epi64(t0,t1);
140 t0 = _mm_unpacklo_epi64(m1,m2); \
156 t0 = _mm_unpacklo_epi64(m0,m2); \
178 t1 = _mm_unpacklo_epi64(m1,m2); \
185 buf = _mm_unpacklo_epi64(t0,t1);
189 t1 = _mm_unpacklo_epi64(t0,m0); \
/external/libaom/libaom/aom_dsp/x86/
Dtranspose_sse2.h86 out[0] = _mm_unpacklo_epi64(c0, c0); in transpose_8bit_8x8()
88 out[2] = _mm_unpacklo_epi64(c1, c1); in transpose_8bit_8x8()
90 out[4] = _mm_unpacklo_epi64(c2, c2); in transpose_8bit_8x8()
92 out[6] = _mm_unpacklo_epi64(c3, c3); in transpose_8bit_8x8()
156 out[0] = _mm_unpacklo_epi64(b0, b1); in transpose_16bit_4x8()
158 out[2] = _mm_unpacklo_epi64(b2, b3); in transpose_16bit_4x8()
200 out[0] = _mm_unpacklo_epi64(b0, zeros); in transpose_16bit_8x4()
202 out[2] = _mm_unpacklo_epi64(b4, zeros); in transpose_16bit_8x4()
204 out[4] = _mm_unpacklo_epi64(b2, zeros); in transpose_16bit_8x4()
206 out[6] = _mm_unpacklo_epi64(b6, zeros); in transpose_16bit_8x4()
[all …]
Dlpf_common_sse2.h39 *d0 = _mm_unpacklo_epi64(ww0, w2); // 00 10 20 30 40 50 41 51 in highbd_transpose6x6_sse2()
44 *d2 = _mm_unpacklo_epi64(ww0, in highbd_transpose6x6_sse2()
54 *d4 = _mm_unpacklo_epi64(ww0, w5); // 04 14 24 34 44 54 45 55 in highbd_transpose6x6_sse2()
72 *d0 = _mm_unpacklo_epi64(ww0, zero); // 00 10 20 30 xx xx xx xx in highbd_transpose4x8_8x4_low_sse2()
74 *d2 = _mm_unpacklo_epi64(ww1, zero); // 02 12 22 32 xx xx xx xx in highbd_transpose4x8_8x4_low_sse2()
91 *d4 = _mm_unpacklo_epi64(ww2, zero); // 04 14 24 34 xx xx xx xx in highbd_transpose4x8_8x4_high_sse2()
93 *d6 = _mm_unpacklo_epi64(ww3, zero); // 06 16 26 36 xx xx xx xx in highbd_transpose4x8_8x4_high_sse2()
147 *d0 = _mm_unpacklo_epi64(ww0, ww1); // 00 10 20 30 40 50 60 70 in highbd_transpose8x8_low_sse2()
153 *d2 = _mm_unpacklo_epi64(ww0, ww1); // 02 12 22 32 42 52 62 72 in highbd_transpose8x8_low_sse2()
180 *d4 = _mm_unpacklo_epi64(ww0, ww1); // 04 14 24 34 44 54 64 74 in highbd_transpose8x8_high_sse2()
[all …]
Dloopfilter_sse2.c135 *pq0 = _mm_unpacklo_epi64(d0, d1); // pq in transpose_pq_14_inv_sse2()
137 *pq2 = _mm_unpacklo_epi64(d2, d3); // pq in transpose_pq_14_inv_sse2()
215 filter = _mm_unpacklo_epi64(filter, filter); in filter4_dual_sse2()
234 filter2filter1 = _mm_unpacklo_epi64(filter2filter1, filter); in filter4_dual_sse2()
295 q1p1 = _mm_unpacklo_epi64(*p1, *q1); in lpf_internal_4_dual_sse2()
296 q0p0 = _mm_unpacklo_epi64(*p0, *q0); in lpf_internal_4_dual_sse2()
298 p1p0 = _mm_unpacklo_epi64(q0p0, q1p1); in lpf_internal_4_dual_sse2()
321 mask = _mm_unpacklo_epi64(mask, flat); in lpf_internal_4_dual_sse2()
405 p1p0 = _mm_unpacklo_epi64(*q0p0, *q1p1); in lpf_internal_14_dual_sse2()
417 abs_p0q0 = _mm_unpacklo_epi64(abs_p0q0, zero); in lpf_internal_14_dual_sse2()
[all …]
Dhighbd_loopfilter_sse2.c58 x0 = _mm_unpacklo_epi64(x0, x1); in get_limit_dual()
63 x0 = _mm_unpacklo_epi64(x0, x1); in get_limit_dual()
68 x0 = _mm_unpacklo_epi64(x0, x1); in get_limit_dual()
119 *p1p0 = _mm_unpacklo_epi64(pq[0], pq[1]); in highbd_hev_filter_mask_x_sse2()
124 abs_p0q0 = _mm_unpacklo_epi64(abs_p0q0, zero); in highbd_hev_filter_mask_x_sse2()
144 *hev = _mm_unpacklo_epi64(*hev, *hev); in highbd_hev_filter_mask_x_sse2()
241 filt = _mm_unpacklo_epi64(filt, filt); in highbd_filter4_sse2()
247 filt = _mm_unpacklo_epi64(filter2filter1, filter2filter1); in highbd_filter4_sse2()
255 filter1filt = _mm_unpacklo_epi64(filter2filter1, filt); in highbd_filter4_sse2()
336 pq[i] = _mm_unpacklo_epi64(p[i], q[i]); in highbd_lpf_internal_14_sse2()
[all …]
Dsse_avx2.c77 const __m128i v_a0123 = _mm_unpacklo_epi64(_mm_unpacklo_epi32(v_a0, v_a1), in sse_w4x4_avx2()
79 const __m128i v_b0123 = _mm_unpacklo_epi64(_mm_unpacklo_epi32(v_b0, v_b1), in sse_w4x4_avx2()
92 const __m256i v_a_w = _mm256_cvtepu8_epi16(_mm_unpacklo_epi64(v_a0, v_a1)); in sse_w8x2_avx2()
93 const __m256i v_b_w = _mm256_cvtepu8_epi16(_mm_unpacklo_epi64(v_b0, v_b1)); in sse_w8x2_avx2()
233 const __m256i v_a_w = yy_set_m128i(_mm_unpacklo_epi64(v_a0, v_a1), in highbd_sse_w4x4_avx2()
234 _mm_unpacklo_epi64(v_a2, v_a3)); in highbd_sse_w4x4_avx2()
235 const __m256i v_b_w = yy_set_m128i(_mm_unpacklo_epi64(v_b0, v_b1), in highbd_sse_w4x4_avx2()
236 _mm_unpacklo_epi64(v_b2, v_b3)); in highbd_sse_w4x4_avx2()
Dhighbd_convolve_sse2.c43 thirdFilters = _mm_unpacklo_epi64(tmp1, tmp1); // coeffs 4 5 4 5 4 5 4 5 in aom_highbd_filter_block1d4_v4_sse2()
125 thirdFilters = _mm_unpacklo_epi64(tmp_1, tmp_1); // coeffs 4 5 4 5 4 5 4 5 in aom_highbd_filter_block1d4_h4_sse2()
182 thirdFilters = _mm_unpacklo_epi64(tmp1, tmp1); // coeffs 4 5 4 5 4 5 4 5 in aom_highbd_filter_block1d8_v4_sse2()
286 thirdFilters = _mm_unpacklo_epi64(tmp_1, tmp_1); // coeffs 4 5 4 5 4 5 4 5 in aom_highbd_filter_block1d8_h4_sse2()
294 __m128i ss_4 = _mm_unpacklo_epi64(ss_4_1, ss_4_2); in aom_highbd_filter_block1d8_h4_sse2()
304 __m128i ss_3 = _mm_unpacklo_epi64(ss_3_1, ss_3_2); in aom_highbd_filter_block1d8_h4_sse2()
305 __m128i ss_5 = _mm_unpacklo_epi64(ss_5_1, ss_5_2); in aom_highbd_filter_block1d8_h4_sse2()
/external/libvpx/libvpx/vpx_dsp/x86/
Dtranspose_sse2.h85 out[0] = _mm_unpacklo_epi64(c0, c0); in transpose_8bit_8x8()
87 out[2] = _mm_unpacklo_epi64(c1, c1); in transpose_8bit_8x8()
89 out[4] = _mm_unpacklo_epi64(c2, c2); in transpose_8bit_8x8()
91 out[6] = _mm_unpacklo_epi64(c3, c3); in transpose_8bit_8x8()
151 out[0] = _mm_unpacklo_epi64(b0, b1); in transpose_16bit_4x8()
153 out[2] = _mm_unpacklo_epi64(b2, b3); in transpose_16bit_4x8()
213 out[0] = _mm_unpacklo_epi64(b0, b1); in transpose_16bit_8x8()
215 out[2] = _mm_unpacklo_epi64(b4, b5); in transpose_16bit_8x8()
217 out[4] = _mm_unpacklo_epi64(b2, b3); in transpose_16bit_8x8()
219 out[6] = _mm_unpacklo_epi64(b6, b7); in transpose_16bit_8x8()
[all …]
Dhighbd_intrapred_intrin_sse2.c52 _mm_store_si128((__m128i *)dst, _mm_unpacklo_epi64(row0, row0)); in vpx_highbd_h_predictor_8x8_sse2()
54 _mm_store_si128((__m128i *)dst, _mm_unpacklo_epi64(row1, row1)); in vpx_highbd_h_predictor_8x8_sse2()
56 _mm_store_si128((__m128i *)dst, _mm_unpacklo_epi64(row2, row2)); in vpx_highbd_h_predictor_8x8_sse2()
58 _mm_store_si128((__m128i *)dst, _mm_unpacklo_epi64(row3, row3)); in vpx_highbd_h_predictor_8x8_sse2()
71 const __m128i val = _mm_unpacklo_epi64(*row, *row); in h_store_16_unpacklo()
115 const __m128i val = _mm_unpacklo_epi64(*row, *row); in h_store_32_unpacklo()
227 const __m128i dc_dup = _mm_unpacklo_epi64(dc_dup_lo, dc_dup_lo); in dc_store_8x8()
278 const __m128i dc_dup = _mm_unpacklo_epi64(dc_dup_lo, dc_dup_lo); in dc_store_16x16()
333 const __m128i dc_dup = _mm_unpacklo_epi64(dc_dup_lo, dc_dup_lo); in dc_store_32x32()
493 const __m128i IJKLLLLL = _mm_unpacklo_epi64(IJKL0000, LLLL0000); in vpx_highbd_d207_predictor_4x4_sse2()
/external/libavc/common/x86/
Dih264_resi_trans_quant_sse42.c170 src_r0 = _mm_unpacklo_epi64(temp1, zero_8x16b); //a0 b0 c0 d0 in ih264_resi_trans_quant_4x4_sse42()
172 src_r2 = _mm_unpacklo_epi64(temp3, zero_8x16b); //a2 b2 c2 d2 in ih264_resi_trans_quant_4x4_sse42()
208 src_r0 = _mm_unpacklo_epi64(temp1, zero_8x16b); //a0 a1 a2 a3 in ih264_resi_trans_quant_4x4_sse42()
210 src_r2 = _mm_unpacklo_epi64(temp3, zero_8x16b); //c0 c1 c2 c3 in ih264_resi_trans_quant_4x4_sse42()
237 src_r0 = _mm_unpacklo_epi64(src_r0, src_r1); //a0 a1 a2 a3 b0 b1 b2 b3 in ih264_resi_trans_quant_4x4_sse42()
238 src_r2 = _mm_unpacklo_epi64(src_r2, src_r3); //c0 c1 c2 c3 d0 d1 d2 d3 in ih264_resi_trans_quant_4x4_sse42()
453 src_r0 = _mm_unpacklo_epi64(temp1, zero_8x16b); //a0 b0 c0 d0 in ih264_resi_trans_quant_chroma_4x4_sse42()
455 src_r2 = _mm_unpacklo_epi64(temp3, zero_8x16b); //a2 b2 c2 d2 in ih264_resi_trans_quant_chroma_4x4_sse42()
491 src_r0 = _mm_unpacklo_epi64(temp1, zero_8x16b); //a0 a1 a2 a3 in ih264_resi_trans_quant_chroma_4x4_sse42()
493 src_r2 = _mm_unpacklo_epi64(temp3, zero_8x16b); //c0 c1 c2 c3 in ih264_resi_trans_quant_chroma_4x4_sse42()
[all …]
Dih264_ihadamard_scaling_sse42.c129 src_r0 = _mm_unpacklo_epi64(temp0, temp2); //a0 b0 c0 d0 in ih264_ihadamard_scaling_4x4_sse42()
131 src_r2 = _mm_unpacklo_epi64(temp1, temp3); //a2 b2 c2 d2 in ih264_ihadamard_scaling_4x4_sse42()
158 src_r0 = _mm_unpacklo_epi64(temp0, temp2); //a0 a1 a2 a3 in ih264_ihadamard_scaling_4x4_sse42()
160 src_r2 = _mm_unpacklo_epi64(temp1, temp3); //c0 c1 c2 c3 in ih264_ihadamard_scaling_4x4_sse42()
228 …plane_0 = _mm_unpacklo_epi64(temp0, temp1); //a0+a1+a2+a3 a0+a1-a2-a3 a0-a1+a2-a3 a0-a1-a2… in ih264_ihadamard_scaling_2x2_uv_sse42()
Dih264_ihadamard_scaling_ssse3.c131 src_r0 = _mm_unpacklo_epi64(temp0, temp2); //a0 b0 c0 d0 in ih264_ihadamard_scaling_4x4_ssse3()
133 src_r2 = _mm_unpacklo_epi64(temp1, temp3); //a2 b2 c2 d2 in ih264_ihadamard_scaling_4x4_ssse3()
160 src_r0 = _mm_unpacklo_epi64(temp0, temp2); //a0 a1 a2 a3 in ih264_ihadamard_scaling_4x4_ssse3()
162 src_r2 = _mm_unpacklo_epi64(temp1, temp3); //c0 c1 c2 c3 in ih264_ihadamard_scaling_4x4_ssse3()
Dih264_iquant_itrans_recon_sse42.c187 resq_r0 = _mm_unpacklo_epi64(temp1, temp3); //a0 b0 c0 d0 in ih264_iquant_itrans_recon_4x4_sse42()
189 resq_r2 = _mm_unpacklo_epi64(temp2, temp4); //a2 b2 c2 d2 in ih264_iquant_itrans_recon_4x4_sse42()
223 resq_r0 = _mm_unpacklo_epi64(temp1, temp3); //a0 a1 a2 a3 in ih264_iquant_itrans_recon_4x4_sse42()
225 resq_r2 = _mm_unpacklo_epi64(temp2, temp4); //c0 c1 c2 c3 in ih264_iquant_itrans_recon_4x4_sse42()
437 resq_r0 = _mm_unpacklo_epi64(temp1, temp3); //a0 b0 c0 d0 in ih264_iquant_itrans_recon_chroma_4x4_sse42()
439 resq_r2 = _mm_unpacklo_epi64(temp2, temp4); //a2 b2 c2 d2 in ih264_iquant_itrans_recon_chroma_4x4_sse42()
473 resq_r0 = _mm_unpacklo_epi64(temp1, temp3); //a0 a1 a2 a3 in ih264_iquant_itrans_recon_chroma_4x4_sse42()
475 resq_r2 = _mm_unpacklo_epi64(temp2, temp4); //c0 c1 c2 c3 in ih264_iquant_itrans_recon_chroma_4x4_sse42()
/external/libhevc/common/x86/
Dihevc_itrans_recon_32x32_ssse3_intr.c1844 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
1874 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
1904 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
1933 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
1962 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
1992 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
2021 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
2051 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
2080 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
2108 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_ssse3()
[all …]
Dihevc_32x32_itrans_recon_sse42_intr.c1833 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
1863 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
1893 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
1922 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
1951 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
1981 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
2010 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
2040 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
2069 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
2097 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_32x32_sse42()
[all …]
Dihevc_deblk_ssse3_intr.c150 src_tmp_8x16b = _mm_unpacklo_epi64(src_row0_8x16b, src_row3_8x16b); in ihevc_deblk_luma_vert_ssse3()
260 src_row0_8x16b = _mm_unpacklo_epi64(src_row0_8x16b, src_row2_8x16b); in ihevc_deblk_luma_vert_ssse3()
261 src_row1_8x16b = _mm_unpacklo_epi64(src_row1_8x16b, src_row3_8x16b); in ihevc_deblk_luma_vert_ssse3()
365 src_row0_8x16b = _mm_unpacklo_epi64(temp_pq_str1_16x8b, temp_str0_16x8b); in ihevc_deblk_luma_vert_ssse3()
367 src_row2_8x16b = _mm_unpacklo_epi64(temp_str2_16x8b, temp_pq_str0_16x8b); in ihevc_deblk_luma_vert_ssse3()
398 src_row0_8x16b = _mm_unpacklo_epi64(src_row0_8x16b, src_row1_8x16b); in ihevc_deblk_luma_vert_ssse3()
399 src_row2_8x16b = _mm_unpacklo_epi64(src_row2_8x16b, src_row3_8x16b); in ihevc_deblk_luma_vert_ssse3()
407 tmp_delta2_8x16b = _mm_unpacklo_epi64(tmp_delta2_8x16b, tmp_delta3_8x16b); in ihevc_deblk_luma_vert_ssse3()
437 mask_pq_8x16b = _mm_unpacklo_epi64(mask_pq_8x16b, mask_pq_8x16b); in ihevc_deblk_luma_vert_ssse3()
720 temp_pq0_str0_16x8b = _mm_unpacklo_epi64(temp_pq0_str0_16x8b, temp_str0_16x8b); in ihevc_deblk_luma_horz_ssse3()
[all …]
Dihevc_itrans_recon_sse42_intr.c220 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_4x4_ttype1_sse42()
311 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_4x4_ttype1_sse42()
360 m_temp_reg_0 = _mm_unpacklo_epi64(m_temp_reg_0, m_temp_reg_1); in ihevc_itrans_recon_4x4_ttype1_sse42()
361 m_temp_reg_1 = _mm_unpacklo_epi64(m_temp_reg_2, m_temp_reg_3); in ihevc_itrans_recon_4x4_ttype1_sse42()
530 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_4x4_sse42()
624 m_rdng_factor = _mm_unpacklo_epi64(m_rdng_factor, m_rdng_factor); in ihevc_itrans_recon_4x4_sse42()
685 m_temp_reg_0 = _mm_unpacklo_epi64(m_temp_reg_0, m_temp_reg_1); in ihevc_itrans_recon_4x4_sse42()
688 m_temp_reg_1 = _mm_unpacklo_epi64(m_temp_reg_2, m_temp_reg_3); in ihevc_itrans_recon_4x4_sse42()
1072 m_temp_reg_50 = _mm_unpacklo_epi64(m_temp_reg_0, m_temp_reg_4); in ihevc_itrans_recon_8x8_sse42()
1074 m_temp_reg_52 = _mm_unpacklo_epi64(m_temp_reg_1, m_temp_reg_5); in ihevc_itrans_recon_8x8_sse42()
[all …]
/external/epid-sdk/ext/ipp/sources/ippcp/
Dpcpsms4ecby8cn.h106 K2 = _mm_unpacklo_epi64(K1, K3); \
109 K0 = _mm_unpacklo_epi64(T, K0)
118 T = _mm_unpacklo_epi64(K1, T); \
119 K1 = _mm_unpacklo_epi64(K3, K0); \
/external/libaom/libaom/aom_dsp/simd/
Dv64_intrinsics_x86.h95 ((c) ? _mm_srli_si128(_mm_unpacklo_epi64(b, a), (c)) : b)
172 __m128i t = _mm_unpacklo_epi64(b, a); in v64_pack_s32_s16()
178 __m128i t = _mm_unpacklo_epi64(b, a); in v64_pack_s32_u16()
193 __m128i t = _mm_unpacklo_epi64(b, a); in v64_pack_s16_u8()
198 __m128i t = _mm_unpacklo_epi64(b, a); in v64_pack_s16_s8()
204 return _mm_shuffle_epi8(_mm_unpacklo_epi64(b, a), in v64_unziphi_8()
208 _mm_unpacklo_epi64(_mm_srli_epi16(b, 8), _mm_srli_epi16(a, 8)), in v64_unziphi_8()
215 return _mm_shuffle_epi8(_mm_unpacklo_epi64(b, a), in v64_unziplo_8()
224 return _mm_shuffle_epi8(_mm_unpacklo_epi64(b, a), in v64_unziphi_16()
228 _mm_unpacklo_epi64(_mm_srai_epi32(b, 16), _mm_srai_epi32(a, 16)), in v64_unziphi_16()
[all …]
/external/libhevc/decoder/x86/
Dihevcd_fmt_conv_ssse3_intr.c153 src_u_8x16b = _mm_unpacklo_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
166 src_u_8x16b = _mm_unpacklo_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
179 src_u_8x16b = _mm_unpacklo_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
192 src_u_8x16b = _mm_unpacklo_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
228 src_u_8x16b = _mm_unpacklo_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
/external/webp/src/dsp/
Dcommon_sse2.h93 *out0 = _mm_unpacklo_epi64(transpose1_0, transpose1_1); in VP8Transpose_2_4x4_16b()
95 *out2 = _mm_unpacklo_epi64(transpose1_2, transpose1_3); in VP8Transpose_2_4x4_16b()
183 *in1 = _mm_unpacklo_epi64(C1, C3); in VP8L32bToPlanar_SSE2()
185 *in3 = _mm_unpacklo_epi64(C0, C2); in VP8L32bToPlanar_SSE2()
/external/libaom/libaom/av1/common/x86/
Dreconinter_avx2.c45 const __m128i s0ABCD = _mm_unpacklo_epi64(s0AB, s0CD); in av1_build_compound_diffwtd_mask_avx2()
54 const __m128i s1ABCD = _mm_unpacklo_epi64(s1AB, s1CD); in av1_build_compound_diffwtd_mask_avx2()
72 const __m256i s0AC_w = _mm256_cvtepu8_epi16(_mm_unpacklo_epi64(s0A, s0C)); in av1_build_compound_diffwtd_mask_avx2()
73 const __m256i s0BD_w = _mm256_cvtepu8_epi16(_mm_unpacklo_epi64(s0B, s0D)); in av1_build_compound_diffwtd_mask_avx2()
78 const __m256i s1AB_w = _mm256_cvtepu8_epi16(_mm_unpacklo_epi64(s1A, s1C)); in av1_build_compound_diffwtd_mask_avx2()
79 const __m256i s1CD_w = _mm256_cvtepu8_epi16(_mm_unpacklo_epi64(s1B, s1D)); in av1_build_compound_diffwtd_mask_avx2()
190 const __m256i s0 = yy_set_m128i(_mm_unpacklo_epi64(s0C, s0D), in build_compound_diffwtd_mask_d16_avx2()
191 _mm_unpacklo_epi64(s0A, s0B)); in build_compound_diffwtd_mask_d16_avx2()
192 const __m256i s1 = yy_set_m128i(_mm_unpacklo_epi64(s1C, s1D), in build_compound_diffwtd_mask_d16_avx2()
193 _mm_unpacklo_epi64(s1A, s1B)); in build_compound_diffwtd_mask_d16_avx2()
[all …]
/external/mesa3d/src/gallium/auxiliary/util/
Du_sse.h263 *o = _mm_unpacklo_epi64(t0, t1); in transpose4_epi32()
265 *q = _mm_unpacklo_epi64(t2, t3); in transpose4_epi32()
289 *o = _mm_unpacklo_epi64(t0, t1); in transpose2_64_2_32()
291 *q = _mm_unpacklo_epi64(t2, t3); in transpose2_64_2_32()

12345