Home
last modified time | relevance | path

Searched refs:_mm_unpackhi_epi64 (Results 1 – 25 of 106) sorted by relevance

12345

/external/python/cpython3/Modules/_blake2/impl/
Dblake2b-load-sse41.h30 b0 = _mm_unpackhi_epi64(m0, m1); \
31 b1 = _mm_unpackhi_epi64(m2, m3); \
46 b0 = _mm_unpackhi_epi64(m4, m5); \
47 b1 = _mm_unpackhi_epi64(m6, m7); \
55 b1 = _mm_unpackhi_epi64(m4, m6); \
71 b1 = _mm_unpackhi_epi64(m5, m2); \
79 b1 = _mm_unpackhi_epi64(m3, m1); \
87 b1 = _mm_unpackhi_epi64(m2, m7); \
103 b1 = _mm_unpackhi_epi64(m3, m4); \
118 b0 = _mm_unpackhi_epi64(m3, m1); \
[all …]
Dblake2b-round.h122 row4l = _mm_unpackhi_epi64(row4h, _mm_unpacklo_epi64(t0, t0)); \
123 row4h = _mm_unpackhi_epi64(t0, _mm_unpacklo_epi64(row4h, row4h)); \
124 row2l = _mm_unpackhi_epi64(row2l, _mm_unpacklo_epi64(row2h, row2h)); \
125 row2h = _mm_unpackhi_epi64(row2h, _mm_unpacklo_epi64(t1, t1))
133 row2l = _mm_unpackhi_epi64(row2h, _mm_unpacklo_epi64(row2l, row2l)); \
134 row2h = _mm_unpackhi_epi64(t0, _mm_unpacklo_epi64(row2h, row2h)); \
135 row4l = _mm_unpackhi_epi64(row4l, _mm_unpacklo_epi64(row4h, row4h)); \
136 row4h = _mm_unpackhi_epi64(row4h, _mm_unpacklo_epi64(t1, t1))
Dblake2s-load-sse41.h103 t1 = _mm_unpackhi_epi64(m0,m2); \
108 t0 = _mm_unpackhi_epi64(m1,m3); \
113 t0 = _mm_unpackhi_epi64(m3,m1); \
114 t1 = _mm_unpackhi_epi64(m2,m0); \
162 t1 = _mm_unpackhi_epi64(m0,t0); \
177 t0 = _mm_unpackhi_epi64(m0,m3); \
221 t2 = _mm_unpackhi_epi64(t0,t1); \
/external/libaom/libaom/aom_dsp/x86/
Dtranspose_sse2.h87 out[1] = _mm_unpackhi_epi64(c0, c0); in transpose_8bit_8x8()
89 out[3] = _mm_unpackhi_epi64(c1, c1); in transpose_8bit_8x8()
91 out[5] = _mm_unpackhi_epi64(c2, c2); in transpose_8bit_8x8()
93 out[7] = _mm_unpackhi_epi64(c3, c3); in transpose_8bit_8x8()
157 out[1] = _mm_unpackhi_epi64(b0, b1); in transpose_16bit_4x8()
159 out[3] = _mm_unpackhi_epi64(b2, b3); in transpose_16bit_4x8()
201 out[1] = _mm_unpackhi_epi64(b0, zeros); in transpose_16bit_8x4()
203 out[3] = _mm_unpackhi_epi64(b4, zeros); in transpose_16bit_8x4()
205 out[5] = _mm_unpackhi_epi64(b2, zeros); in transpose_16bit_8x4()
207 out[7] = _mm_unpackhi_epi64(b6, zeros); in transpose_16bit_8x4()
[all …]
Dadaptive_quantize_sse2.c81 zbin = _mm_unpackhi_epi64(zbin, zbin); // Switch DC to AC in aom_quantize_b_adaptive_sse2()
94 round = _mm_unpackhi_epi64(round, round); in aom_quantize_b_adaptive_sse2()
95 quant = _mm_unpackhi_epi64(quant, quant); in aom_quantize_b_adaptive_sse2()
96 shift = _mm_unpackhi_epi64(shift, shift); in aom_quantize_b_adaptive_sse2()
97 dequant = _mm_unpackhi_epi64(dequant, dequant); in aom_quantize_b_adaptive_sse2()
101 round = _mm_unpackhi_epi64(round, round); in aom_quantize_b_adaptive_sse2()
102 quant = _mm_unpackhi_epi64(quant, quant); in aom_quantize_b_adaptive_sse2()
103 shift = _mm_unpackhi_epi64(shift, shift); in aom_quantize_b_adaptive_sse2()
119 dequant = _mm_unpackhi_epi64(dequant, dequant); in aom_quantize_b_adaptive_sse2()
289 zbin = _mm_unpackhi_epi64(zbin, zbin); // Switch DC to AC in aom_quantize_b_32x32_adaptive_sse2()
[all …]
Dlpf_common_sse2.h40 *d1 = _mm_unpackhi_epi64(ww0, in highbd_transpose6x6_sse2()
51 *d3 = _mm_unpackhi_epi64(ww0, _mm_srli_si128(w2, 4)); // 03 13 23 33 43 53 in highbd_transpose6x6_sse2()
55 *d5 = _mm_unpackhi_epi64(ww0, in highbd_transpose6x6_sse2()
73 *d1 = _mm_unpackhi_epi64(ww0, zero); // 01 11 21 31 xx xx xx xx in highbd_transpose4x8_8x4_low_sse2()
75 *d3 = _mm_unpackhi_epi64(ww1, zero); // 03 13 23 33 xx xx xx xx in highbd_transpose4x8_8x4_low_sse2()
92 *d5 = _mm_unpackhi_epi64(ww2, zero); // 05 15 25 35 xx xx xx xx in highbd_transpose4x8_8x4_high_sse2()
94 *d7 = _mm_unpackhi_epi64(ww3, zero); // 07 17 27 37 xx xx xx xx in highbd_transpose4x8_8x4_high_sse2()
148 *d1 = _mm_unpackhi_epi64(ww0, ww1); // 01 11 21 31 41 51 61 71 in highbd_transpose8x8_low_sse2()
154 *d3 = _mm_unpackhi_epi64(ww0, ww1); // 03 13 23 33 43 53 63 73 in highbd_transpose8x8_low_sse2()
181 *d5 = _mm_unpackhi_epi64(ww0, ww1); // 05 15 25 35 45 55 65 75 in highbd_transpose8x8_high_sse2()
[all …]
Dquantize_ssse3.c104 zbin = _mm_unpackhi_epi64(zbin, zbin); in aom_quantize_b_64x64_ssse3()
116 round = _mm_unpackhi_epi64(round, round); in aom_quantize_b_64x64_ssse3()
117 quant = _mm_unpackhi_epi64(quant, quant); in aom_quantize_b_64x64_ssse3()
118 shift = _mm_unpackhi_epi64(shift, shift); in aom_quantize_b_64x64_ssse3()
119 dequant = _mm_unpackhi_epi64(dequant, dequant); in aom_quantize_b_64x64_ssse3()
122 round = _mm_unpackhi_epi64(round, round); in aom_quantize_b_64x64_ssse3()
123 quant = _mm_unpackhi_epi64(quant, quant); in aom_quantize_b_64x64_ssse3()
124 shift = _mm_unpackhi_epi64(shift, shift); in aom_quantize_b_64x64_ssse3()
139 dequant = _mm_unpackhi_epi64(dequant, dequant); in aom_quantize_b_64x64_ssse3()
Dquantize_sse2.c54 zbin = _mm_unpackhi_epi64(zbin, zbin); // Switch DC to AC in aom_quantize_b_sse2()
59 round = _mm_unpackhi_epi64(round, round); in aom_quantize_b_sse2()
60 quant = _mm_unpackhi_epi64(quant, quant); in aom_quantize_b_sse2()
61 shift = _mm_unpackhi_epi64(shift, shift); in aom_quantize_b_sse2()
77 dequant = _mm_unpackhi_epi64(dequant, dequant); in aom_quantize_b_sse2()
/external/libvpx/libvpx/vpx_dsp/x86/
Dtranspose_sse2.h86 out[1] = _mm_unpackhi_epi64(c0, c0); in transpose_8bit_8x8()
88 out[3] = _mm_unpackhi_epi64(c1, c1); in transpose_8bit_8x8()
90 out[5] = _mm_unpackhi_epi64(c2, c2); in transpose_8bit_8x8()
92 out[7] = _mm_unpackhi_epi64(c3, c3); in transpose_8bit_8x8()
152 out[1] = _mm_unpackhi_epi64(b0, b1); in transpose_16bit_4x8()
154 out[3] = _mm_unpackhi_epi64(b2, b3); in transpose_16bit_4x8()
214 out[1] = _mm_unpackhi_epi64(b0, b1); in transpose_16bit_8x8()
216 out[3] = _mm_unpackhi_epi64(b4, b5); in transpose_16bit_8x8()
218 out[5] = _mm_unpackhi_epi64(b2, b3); in transpose_16bit_8x8()
220 out[7] = _mm_unpackhi_epi64(b6, b7); in transpose_16bit_8x8()
[all …]
Dquantize_avx.c58 zbin = _mm_unpackhi_epi64(zbin, zbin); // Switch DC to AC in vpx_quantize_b_avx()
72 round = _mm_unpackhi_epi64(round, round); in vpx_quantize_b_avx()
73 quant = _mm_unpackhi_epi64(quant, quant); in vpx_quantize_b_avx()
74 shift = _mm_unpackhi_epi64(shift, shift); in vpx_quantize_b_avx()
75 dequant = _mm_unpackhi_epi64(dequant, dequant); in vpx_quantize_b_avx()
78 round = _mm_unpackhi_epi64(round, round); in vpx_quantize_b_avx()
79 quant = _mm_unpackhi_epi64(quant, quant); in vpx_quantize_b_avx()
80 shift = _mm_unpackhi_epi64(shift, shift); in vpx_quantize_b_avx()
95 dequant = _mm_unpackhi_epi64(dequant, dequant); in vpx_quantize_b_avx()
199 zbin = _mm_unpackhi_epi64(zbin, zbin); // Switch DC to AC. in vpx_quantize_b_32x32_avx()
[all …]
Dquantize_ssse3.c51 zbin = _mm_unpackhi_epi64(zbin, zbin); // Switch DC to AC in vpx_quantize_b_ssse3()
55 round = _mm_unpackhi_epi64(round, round); in vpx_quantize_b_ssse3()
56 quant = _mm_unpackhi_epi64(quant, quant); in vpx_quantize_b_ssse3()
57 shift = _mm_unpackhi_epi64(shift, shift); in vpx_quantize_b_ssse3()
72 dequant = _mm_unpackhi_epi64(dequant, dequant); in vpx_quantize_b_ssse3()
167 zbin = _mm_unpackhi_epi64(zbin, zbin); // Switch DC to AC. in vpx_quantize_b_32x32_ssse3()
183 round = _mm_unpackhi_epi64(round, round); in vpx_quantize_b_32x32_ssse3()
184 quant = _mm_unpackhi_epi64(quant, quant); in vpx_quantize_b_32x32_ssse3()
185 shift = _mm_unpackhi_epi64(shift, shift); in vpx_quantize_b_32x32_ssse3()
186 dequant = _mm_unpackhi_epi64(dequant, dequant); in vpx_quantize_b_32x32_ssse3()
[all …]
Dquantize_sse2.c55 zbin = _mm_unpackhi_epi64(zbin, zbin); // Switch DC to AC in vpx_quantize_b_sse2()
60 round = _mm_unpackhi_epi64(round, round); in vpx_quantize_b_sse2()
61 quant = _mm_unpackhi_epi64(quant, quant); in vpx_quantize_b_sse2()
62 shift = _mm_unpackhi_epi64(shift, shift); in vpx_quantize_b_sse2()
78 dequant = _mm_unpackhi_epi64(dequant, dequant); in vpx_quantize_b_sse2()
Dinv_txfm_sse2.h55 out[1] = _mm_unpackhi_epi64(tr1_0, tr1_1); in idct8x8_12_transpose_16bit_4x8()
57 out[3] = _mm_unpackhi_epi64(tr1_2, tr1_3); in idct8x8_12_transpose_16bit_4x8()
318 step2[6] = _mm_unpackhi_epi64(step2[5], zero); // step2 6 in idct8x8_12_add_kernel_sse2()
326 step1[2] = _mm_unpackhi_epi64(tmp[1], tmp[0]); // step1 2&1 in idct8x8_12_add_kernel_sse2()
459 step1[13] = _mm_unpackhi_epi64(step2[11], zero); in idct16x16_10_pass1()
460 step1[14] = _mm_unpackhi_epi64(step2[8], zero); in idct16x16_10_pass1()
477 step2[6] = _mm_unpackhi_epi64(step1[4], zero); in idct16x16_10_pass1()
489 step1[12] = _mm_unpackhi_epi64(step1[11], zero); in idct16x16_10_pass1()
490 step1[13] = _mm_unpackhi_epi64(step1[10], zero); in idct16x16_10_pass1()
491 step1[14] = _mm_unpackhi_epi64(step1[9], zero); in idct16x16_10_pass1()
[all …]
Dinv_txfm_ssse3.h44 tmp[1] = _mm_unpackhi_epi64(io[0], io[0]); in idct8x8_12_add_kernel_ssse3()
46 tmp[3] = _mm_unpackhi_epi64(io[1], io[1]); in idct8x8_12_add_kernel_ssse3()
55 step2[6] = _mm_unpackhi_epi64(step2[5], step2[5]); // step2 6 in idct8x8_12_add_kernel_ssse3()
62 step1[2] = _mm_unpackhi_epi64(tmp[1], tmp[0]); // step1 2&1 in idct8x8_12_add_kernel_ssse3()
/external/epid-sdk/ext/ipp/sources/ippcp/
Dpcpsms4ecby8cn.h107 K3 = _mm_unpackhi_epi64(K1, K3); \
108 K1 = _mm_unpackhi_epi64(T, K0); \
117 K2 = _mm_unpackhi_epi64(K1, T); \
120 K0 = _mm_unpackhi_epi64(K3, K0); \
/external/libavc/common/x86/
Dih264_ihadamard_scaling_sse42.c130 src_r1 = _mm_unpackhi_epi64(temp0, temp2); //a1 b1 c1 d1 in ih264_ihadamard_scaling_4x4_sse42()
132 src_r3 = _mm_unpackhi_epi64(temp1, temp3); //a3 b3 c3 d3 in ih264_ihadamard_scaling_4x4_sse42()
159 src_r1 = _mm_unpackhi_epi64(temp0, temp2); //b0 b1 b2 b3 in ih264_ihadamard_scaling_4x4_sse42()
161 src_r3 = _mm_unpackhi_epi64(temp1, temp3); //d0 d1 d2 d3 in ih264_ihadamard_scaling_4x4_sse42()
229 …plane_1 = _mm_unpackhi_epi64(temp0, temp1); //b0+b1+b2+b3 b0+b1-b2-b3 b0-b1+b2-b3 b0-b1-b2… in ih264_ihadamard_scaling_2x2_uv_sse42()
Dih264_ihadamard_scaling_ssse3.c132 src_r1 = _mm_unpackhi_epi64(temp0, temp2); //a1 b1 c1 d1 in ih264_ihadamard_scaling_4x4_ssse3()
134 src_r3 = _mm_unpackhi_epi64(temp1, temp3); //a3 b3 c3 d3 in ih264_ihadamard_scaling_4x4_ssse3()
161 src_r1 = _mm_unpackhi_epi64(temp0, temp2); //b0 b1 b2 b3 in ih264_ihadamard_scaling_4x4_ssse3()
163 src_r3 = _mm_unpackhi_epi64(temp1, temp3); //d0 d1 d2 d3 in ih264_ihadamard_scaling_4x4_ssse3()
Dih264_resi_trans_quant_sse42.c171 src_r1 = _mm_unpackhi_epi64(temp1, zero_8x16b); //a1 b1 c1 d1 in ih264_resi_trans_quant_4x4_sse42()
173 src_r3 = _mm_unpackhi_epi64(temp3, zero_8x16b); //a3 b3 c3 d3 in ih264_resi_trans_quant_4x4_sse42()
209 src_r1 = _mm_unpackhi_epi64(temp1, zero_8x16b); //b0 b1 b2 b3 in ih264_resi_trans_quant_4x4_sse42()
211 src_r3 = _mm_unpackhi_epi64(temp3, zero_8x16b); //d0 d1 d2 d3 in ih264_resi_trans_quant_4x4_sse42()
454 src_r1 = _mm_unpackhi_epi64(temp1, zero_8x16b); //a1 b1 c1 d1 in ih264_resi_trans_quant_chroma_4x4_sse42()
456 src_r3 = _mm_unpackhi_epi64(temp3, zero_8x16b); //a3 b3 c3 d3 in ih264_resi_trans_quant_chroma_4x4_sse42()
492 src_r1 = _mm_unpackhi_epi64(temp1, zero_8x16b); //b0 b1 b2 b3 in ih264_resi_trans_quant_chroma_4x4_sse42()
494 src_r3 = _mm_unpackhi_epi64(temp3, zero_8x16b); //d0 d1 d2 d3 in ih264_resi_trans_quant_chroma_4x4_sse42()
711 src_r1 = _mm_unpackhi_epi64(temp0, temp2); //a1 b1 c1 d1 in ih264_hadamard_quant_4x4_sse42()
713 src_r3 = _mm_unpackhi_epi64(temp1, temp3); //a3 b3 c3 d3 in ih264_hadamard_quant_4x4_sse42()
[all …]
Dih264_iquant_itrans_recon_sse42.c188 resq_r1 = _mm_unpackhi_epi64(temp1, temp3); //a1 b1 c1 d1 in ih264_iquant_itrans_recon_4x4_sse42()
190 resq_r3 = _mm_unpackhi_epi64(temp2, temp4); //a3 b3 c3 d3 in ih264_iquant_itrans_recon_4x4_sse42()
224 resq_r1 = _mm_unpackhi_epi64(temp1, temp3); //b0 b1 b2 b3 in ih264_iquant_itrans_recon_4x4_sse42()
226 resq_r3 = _mm_unpackhi_epi64(temp2, temp4); //d0 d1 d2 d3 in ih264_iquant_itrans_recon_4x4_sse42()
438 resq_r1 = _mm_unpackhi_epi64(temp1, temp3); //a1 b1 c1 d1 in ih264_iquant_itrans_recon_chroma_4x4_sse42()
440 resq_r3 = _mm_unpackhi_epi64(temp2, temp4); //a3 b3 c3 d3 in ih264_iquant_itrans_recon_chroma_4x4_sse42()
474 resq_r1 = _mm_unpackhi_epi64(temp1, temp3); //b0 b1 b2 b3 in ih264_iquant_itrans_recon_chroma_4x4_sse42()
476 resq_r3 = _mm_unpackhi_epi64(temp2, temp4); //d0 d1 d2 d3 in ih264_iquant_itrans_recon_chroma_4x4_sse42()
/external/libopus/celt/x86/
Dpitch_sse4_1.c98 acc1 = _mm_add_epi32(acc1, _mm_unpackhi_epi64(acc1, acc1)); in celt_inner_prod_sse4_1()
141 sum0 = _mm_add_epi32(sum0, _mm_unpackhi_epi64( sum0, sum0)); in xcorr_kernel_sse4_1()
144 sum1 = _mm_add_epi32(sum1, _mm_unpackhi_epi64( sum1, sum1)); in xcorr_kernel_sse4_1()
147 sum2 = _mm_add_epi32(sum2, _mm_unpackhi_epi64( sum2, sum2)); in xcorr_kernel_sse4_1()
150 sum3 = _mm_add_epi32(sum3, _mm_unpackhi_epi64( sum3, sum3)); in xcorr_kernel_sse4_1()
/external/libhevc/decoder/x86/
Dihevcd_fmt_conv_ssse3_intr.c154 src_v_8x16b = _mm_unpackhi_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
167 src_v_8x16b = _mm_unpackhi_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
180 src_v_8x16b = _mm_unpackhi_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
193 src_v_8x16b = _mm_unpackhi_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
229 src_v_8x16b = _mm_unpackhi_epi64(temp0_8x16b, temp1_8x16b); in ihevcd_fmt_conv_420sp_to_420p_ssse3()
/external/webp/src/dsp/
Dcommon_sse2.h94 *out1 = _mm_unpackhi_epi64(transpose1_0, transpose1_1); in VP8Transpose_2_4x4_16b()
96 *out3 = _mm_unpackhi_epi64(transpose1_2, transpose1_3); in VP8Transpose_2_4x4_16b()
182 *in0 = _mm_unpackhi_epi64(C1, C3); in VP8L32bToPlanar_SSE2()
184 *in2 = _mm_unpackhi_epi64(C0, C2); in VP8L32bToPlanar_SSE2()
/external/mesa3d/src/gallium/auxiliary/util/
Du_sse.h264 *p = _mm_unpackhi_epi64(t0, t1); in transpose4_epi32()
266 *r = _mm_unpackhi_epi64(t2, t3); in transpose4_epi32()
290 *p = _mm_unpackhi_epi64(t0, t1); in transpose2_64_2_32()
292 *r = _mm_unpackhi_epi64(t2, t3); in transpose2_64_2_32()
/external/libaom/libaom/av1/common/x86/
Dhighbd_wiener_convolve_ssse3.c59 const __m128i coeff_23 = _mm_unpackhi_epi64(tmp_0, tmp_0); in av1_highbd_wiener_convolve_add_src_ssse3()
63 const __m128i coeff_67 = _mm_unpackhi_epi64(tmp_1, tmp_1); in av1_highbd_wiener_convolve_add_src_ssse3()
127 const __m128i coeff_23 = _mm_unpackhi_epi64(tmp_0, tmp_0); in av1_highbd_wiener_convolve_add_src_ssse3()
131 const __m128i coeff_67 = _mm_unpackhi_epi64(tmp_1, tmp_1); in av1_highbd_wiener_convolve_add_src_ssse3()
Dwiener_convolve_sse2.c58 const __m128i coeff_23 = _mm_unpackhi_epi64(tmp_0, tmp_0); in av1_wiener_convolve_add_src_sse2()
62 const __m128i coeff_67 = _mm_unpackhi_epi64(tmp_1, tmp_1); in av1_wiener_convolve_add_src_sse2()
125 const __m128i coeff_23 = _mm_unpackhi_epi64(tmp_0, tmp_0); in av1_wiener_convolve_add_src_sse2()
129 const __m128i coeff_67 = _mm_unpackhi_epi64(tmp_1, tmp_1); in av1_wiener_convolve_add_src_sse2()

12345