Home
last modified time | relevance | path

Searched refs:_mm256_unpackhi_epi32 (Results 1 – 22 of 22) sorted by relevance

/external/libaom/libaom/aom_dsp/x86/
Dcommon_avx2.h58 __m256i tr1_1 = _mm256_unpackhi_epi32(tr0_0, tr0_2); in mm256_transpose_16x16()
60 __m256i tr1_3 = _mm256_unpackhi_epi32(tr0_1, tr0_3); in mm256_transpose_16x16()
62 __m256i tr1_5 = _mm256_unpackhi_epi32(tr0_4, tr0_6); in mm256_transpose_16x16()
64 __m256i tr1_7 = _mm256_unpackhi_epi32(tr0_5, tr0_7); in mm256_transpose_16x16()
67 __m256i tr1_9 = _mm256_unpackhi_epi32(tr0_8, tr0_a); in mm256_transpose_16x16()
69 __m256i tr1_b = _mm256_unpackhi_epi32(tr0_9, tr0_b); in mm256_transpose_16x16()
71 __m256i tr1_d = _mm256_unpackhi_epi32(tr0_c, tr0_e); in mm256_transpose_16x16()
73 __m256i tr1_f = _mm256_unpackhi_epi32(tr0_d, tr0_f); in mm256_transpose_16x16()
Dtxfm_common_avx2.h143 b[i / 2 + 8] = _mm256_unpackhi_epi32(a[i], a[i + 1]); in transpose_16bit_16x16_avx2()
186 const __m256i b4 = _mm256_unpackhi_epi32(a0, a1); in transpose_16bit_16x8_avx2()
187 const __m256i b5 = _mm256_unpackhi_epi32(a2, a3); in transpose_16bit_16x8_avx2()
188 const __m256i b6 = _mm256_unpackhi_epi32(a4, a5); in transpose_16bit_16x8_avx2()
189 const __m256i b7 = _mm256_unpackhi_epi32(a6, a7); in transpose_16bit_16x8_avx2()
Davg_intrin_avx2.c68 b2 = _mm256_unpackhi_epi32(a0, a1); in hadamard_col8x2_avx2()
69 b3 = _mm256_unpackhi_epi32(a4, a5); in hadamard_col8x2_avx2()
72 b6 = _mm256_unpackhi_epi32(a2, a3); in hadamard_col8x2_avx2()
73 b7 = _mm256_unpackhi_epi32(a6, a7); in hadamard_col8x2_avx2()
Dhighbd_variance_avx2.c46 __m256i v_d_h = _mm256_unpackhi_epi32(v_sum0, v_sse_d); in aom_highbd_calc8x8var_avx2()
74 __m256i v_d_h = _mm256_unpackhi_epi32(v_sum0, v_sse_d); in aom_highbd_calc16x16var_avx2()
Dintrapred_avx2.c125 ww0 = _mm256_unpackhi_epi32(w0, w1); // 02 12 22 32 03 13 23 33 in highbd_transpose4x16_avx2()
126 ww1 = _mm256_unpackhi_epi32(w2, w3); // 42 52 62 72 43 53 63 73 in highbd_transpose4x16_avx2()
146 ww0 = _mm256_unpackhi_epi32(w0, w1); // 02 12 22 32 03 13 23 33 in highbd_transpose8x16_16x8_avx2()
147 ww1 = _mm256_unpackhi_epi32(w2, w3); // 42 52 62 72 43 53 63 73 in highbd_transpose8x16_16x8_avx2()
163 ww0 = _mm256_unpackhi_epi32(w0, w1); // 06 16 26 36 07 17 27 37 in highbd_transpose8x16_16x8_avx2()
164 ww1 = _mm256_unpackhi_epi32(w2, w3); // 46 56 66 76 47 57 67 77 in highbd_transpose8x16_16x8_avx2()
184 ww0 = _mm256_unpackhi_epi32(w0, w1); // in highbd_transpose16x16_avx2()
185 ww1 = _mm256_unpackhi_epi32(w2, w3); // in highbd_transpose16x16_avx2()
201 ww0 = _mm256_unpackhi_epi32(w0, w1); // in highbd_transpose16x16_avx2()
202 ww1 = _mm256_unpackhi_epi32(w2, w3); // in highbd_transpose16x16_avx2()
[all …]
Dsse_avx2.c39 const __m256i sum1_4x64 = _mm256_unpackhi_epi32(*sum_all, zero); in summary_all_avx2()
/external/libvpx/libvpx/vpx_dsp/x86/
Dfwd_dct32x32_impl_avx2.h1554 u[1] = _mm256_unpackhi_epi32(lstep3[12], lstep3[10]); in FDCT32x32_2D_AVX2()
1556 u[3] = _mm256_unpackhi_epi32(lstep3[13], lstep3[11]); in FDCT32x32_2D_AVX2()
1593 u[1] = _mm256_unpackhi_epi32(lstep3[36], lstep3[58]); in FDCT32x32_2D_AVX2()
1595 u[3] = _mm256_unpackhi_epi32(lstep3[37], lstep3[59]); in FDCT32x32_2D_AVX2()
1597 u[5] = _mm256_unpackhi_epi32(lstep3[38], lstep3[56]); in FDCT32x32_2D_AVX2()
1599 u[7] = _mm256_unpackhi_epi32(lstep3[39], lstep3[57]); in FDCT32x32_2D_AVX2()
1601 u[9] = _mm256_unpackhi_epi32(lstep3[40], lstep3[54]); in FDCT32x32_2D_AVX2()
1603 u[11] = _mm256_unpackhi_epi32(lstep3[41], lstep3[55]); in FDCT32x32_2D_AVX2()
1605 u[13] = _mm256_unpackhi_epi32(lstep3[42], lstep3[52]); in FDCT32x32_2D_AVX2()
1607 u[15] = _mm256_unpackhi_epi32(lstep3[43], lstep3[53]); in FDCT32x32_2D_AVX2()
[all …]
Davg_intrin_avx2.c59 a2 = _mm256_unpackhi_epi32(b0, b1); in highbd_hadamard_col8_avx2()
60 a3 = _mm256_unpackhi_epi32(b2, b3); in highbd_hadamard_col8_avx2()
63 a6 = _mm256_unpackhi_epi32(b4, b5); in highbd_hadamard_col8_avx2()
64 a7 = _mm256_unpackhi_epi32(b6, b7); in highbd_hadamard_col8_avx2()
270 b2 = _mm256_unpackhi_epi32(a0, a1); in hadamard_col8x2_avx2()
271 b3 = _mm256_unpackhi_epi32(a4, a5); in hadamard_col8x2_avx2()
274 b6 = _mm256_unpackhi_epi32(a2, a3); in hadamard_col8x2_avx2()
275 b7 = _mm256_unpackhi_epi32(a6, a7); in hadamard_col8x2_avx2()
/external/libvpx/libvpx/vp9/encoder/x86/
Dvp9_error_avx2.c77 exp_dqcoeff_hi = _mm256_unpackhi_epi32(dqcoeff_0, zero); in vp9_block_error_avx2()
80 exp_coeff_hi = _mm256_unpackhi_epi32(coeff_0, zero); in vp9_block_error_avx2()
141 const __m256i exp_error_hi = _mm256_unpackhi_epi32(error, zero); in vp9_block_error_fp_avx2()
/external/libaom/libaom/av1/encoder/x86/
Derror_intrin_avx2.c58 exp_dqcoeff_hi = _mm256_unpackhi_epi32(dqcoeff_reg, zero_reg); in av1_block_error_avx2()
61 exp_coeff_hi = _mm256_unpackhi_epi32(coeff_reg, zero_reg); in av1_block_error_avx2()
Dwedge_utils_avx2.c136 _mm256_unpackhi_epi32(v_acc0_d, v_sign_d)); in av1_wedge_sign_from_residuals_avx2()
Dav1_fwd_txfm2d_avx2.c1436 __m256i temp1 = _mm256_unpackhi_epi32(inputA[0], inputA[2]); in transpose_32_8x8_avx2()
1438 __m256i temp3 = _mm256_unpackhi_epi32(inputA[1], inputA[3]); in transpose_32_8x8_avx2()
1440 __m256i temp5 = _mm256_unpackhi_epi32(inputA[4], inputA[6]); in transpose_32_8x8_avx2()
1442 __m256i temp7 = _mm256_unpackhi_epi32(inputA[5], inputA[7]); in transpose_32_8x8_avx2()
1445 __m256i t1 = _mm256_unpackhi_epi32(temp0, temp2); in transpose_32_8x8_avx2()
1447 __m256i t3 = _mm256_unpackhi_epi32(temp1, temp3); in transpose_32_8x8_avx2()
1449 __m256i t5 = _mm256_unpackhi_epi32(temp4, temp6); in transpose_32_8x8_avx2()
1451 __m256i t7 = _mm256_unpackhi_epi32(temp5, temp7); in transpose_32_8x8_avx2()
Dhighbd_fwd_txfm_avx2.c152 u1 = _mm256_unpackhi_epi32(in[0 * instride], in[1 * instride]); in av1_fwd_txfm_transpose_8x8_avx2()
155 u3 = _mm256_unpackhi_epi32(in[2 * instride], in[3 * instride]); in av1_fwd_txfm_transpose_8x8_avx2()
158 u5 = _mm256_unpackhi_epi32(in[4 * instride], in[5 * instride]); in av1_fwd_txfm_transpose_8x8_avx2()
161 u7 = _mm256_unpackhi_epi32(in[6 * instride], in[7 * instride]); in av1_fwd_txfm_transpose_8x8_avx2()
/external/eigen/Eigen/src/Core/arch/CUDA/
DPacketMathHalf.h569 __m256i abcd_47 = _mm256_unpackhi_epi32(ab_07, cd_07);
571 __m256i efgh_47 = _mm256_unpackhi_epi32(ef_07, gh_07);
573 __m256i ijkl_47 = _mm256_unpackhi_epi32(ij_07, kl_07);
575 __m256i mnop_47 = _mm256_unpackhi_epi32(mn_07, op_07);
578 __m256i abcd_cf = _mm256_unpackhi_epi32(ab_8f, cd_8f);
580 __m256i efgh_cf = _mm256_unpackhi_epi32(ef_8f, gh_8f);
582 __m256i ijkl_cf = _mm256_unpackhi_epi32(ij_8f, kl_8f);
584 __m256i mnop_cf = _mm256_unpackhi_epi32(mn_8f, op_8f);
/external/libaom/libaom/av1/common/x86/
Dhighbd_wiener_convolve_avx2.c226 const __m256i res_hi = _mm256_unpackhi_epi32(res_even, res_odd); in av1_highbd_wiener_convolve_add_src_avx2()
Dwiener_convolve_avx2.c232 const __m256i res_hi = _mm256_unpackhi_epi32(res_even, res_odd); in av1_wiener_convolve_add_src_avx2()
Dhighbd_inv_txfm_avx2.c124 u1 = _mm256_unpackhi_epi32(in[0], in[1]); in transpose_8x8_avx2()
127 u3 = _mm256_unpackhi_epi32(in[2], in[3]); in transpose_8x8_avx2()
130 u5 = _mm256_unpackhi_epi32(in[4], in[5]); in transpose_8x8_avx2()
133 u7 = _mm256_unpackhi_epi32(in[6], in[7]); in transpose_8x8_avx2()
161 u1 = _mm256_unpackhi_epi32(in[7], in[6]); in transpose_8x8_flip_avx2()
164 u3 = _mm256_unpackhi_epi32(in[5], in[4]); in transpose_8x8_flip_avx2()
167 u5 = _mm256_unpackhi_epi32(in[3], in[2]); in transpose_8x8_flip_avx2()
170 u7 = _mm256_unpackhi_epi32(in[1], in[0]); in transpose_8x8_flip_avx2()
Dhighbd_jnt_convolve_avx2.c585 __m256i res2 = _mm256_unpackhi_epi32(res_even, res_odd); in av1_highbd_dist_wtd_convolve_x_avx2()
/external/libaom/libaom/aom_dsp/simd/
Dv256_intrinsics_x86.h172 return _mm256_unpackhi_epi32( in v256_ziphi_32()
739 return v256_add_64(s, v256_add_64(_mm256_unpackhi_epi32(d, v256_zero()), in v256_ssd_s16()
/external/clang/test/CodeGen/
Davx2-builtins.c1189 return _mm256_unpackhi_epi32(a, b); in test_mm256_unpackhi_epi32()
/external/clang/lib/Headers/
Davx2intrin.h791 _mm256_unpackhi_epi32(__m256i __a, __m256i __b) in _mm256_unpackhi_epi32() function
Davx512vlintrin.h6879 (__v8si)_mm256_unpackhi_epi32(__A, __B), in _mm256_mask_unpackhi_epi32()
6887 (__v8si)_mm256_unpackhi_epi32(__A, __B), in _mm256_maskz_unpackhi_epi32()