/external/libavc/common/x86/ |
D | ih264_iquant_itrans_recon_ssse3.c | 140 …temp4 = _mm_unpacklo_epi16(temp0, zero_8x16b); // b00*q00 0 b01*q01 0 b02*q02 0 b03*q03 0 -- 16 bi… in ih264_iquant_itrans_recon_4x4_ssse3() 142 …temp6 = _mm_unpacklo_epi16(temp1, zero_8x16b); // b00*q00 0 b01*q01 0 b02*q02 0 b03*q03 0 -- 16 bi… in ih264_iquant_itrans_recon_4x4_ssse3() 145 src_r0 = _mm_unpacklo_epi16(src_r0_r1, zero_8x16b); // a00 0 a01 0 a02 0 a03 0 -- 16 bit long in ih264_iquant_itrans_recon_4x4_ssse3() 147 src_r2 = _mm_unpacklo_epi16(src_r2_r3, zero_8x16b); // a20 0 a21 0 a22 0 a23 0 -- 16 bit long in ih264_iquant_itrans_recon_4x4_ssse3() 249 pred_r0 = _mm_unpacklo_epi16(pred_r0, zero_8x16b); //p00 p01 p02 p03 -- 32 bits sign extended in ih264_iquant_itrans_recon_4x4_ssse3() 250 pred_r1 = _mm_unpacklo_epi16(pred_r1, zero_8x16b); //p10 p11 p12 p13 -- 32 bits sign extended in ih264_iquant_itrans_recon_4x4_ssse3() 251 pred_r2 = _mm_unpacklo_epi16(pred_r2, zero_8x16b); //p20 p21 p22 p23 -- 32 bits sign extended in ih264_iquant_itrans_recon_4x4_ssse3() 252 pred_r3 = _mm_unpacklo_epi16(pred_r3, zero_8x16b); //p30 p31 p32 p33 -- 32 bits sign extended in ih264_iquant_itrans_recon_4x4_ssse3() 415 src_r0_1 = _mm_unpacklo_epi16(src_r0, zero_8x16b); //a00 0 a01 0 a02 0 a03 0 -- 16 bit long in ih264_iquant_itrans_recon_8x8_ssse3() 418 …scalemat_r0_1 = _mm_unpacklo_epi16(temp10, zero_8x16b); // b00*q0 0 b01*q1 0 b02*q2 0 b03*q3 0 -- … in ih264_iquant_itrans_recon_8x8_ssse3() [all …]
|
D | ih264_deblk_chroma_ssse3.c | 124 temp1 = _mm_unpacklo_epi16(linea, lineb); in ih264_deblk_chroma_vert_bs4_ssse3() 125 temp2 = _mm_unpacklo_epi16(linec, lined); in ih264_deblk_chroma_vert_bs4_ssse3() 126 temp3 = _mm_unpacklo_epi16(linee, linef); in ih264_deblk_chroma_vert_bs4_ssse3() 127 temp4 = _mm_unpacklo_epi16(lineg, lineh); in ih264_deblk_chroma_vert_bs4_ssse3() 218 temp1 = _mm_unpacklo_epi16(p1_uv_16x8, p0_uv_16x8); in ih264_deblk_chroma_vert_bs4_ssse3() 220 temp3 = _mm_unpacklo_epi16(q0_uv_16x8, q1_uv_16x8); in ih264_deblk_chroma_vert_bs4_ssse3() 473 temp1 = _mm_unpacklo_epi16(linea, lineb); in ih264_deblk_chroma_vert_bslt4_ssse3() 474 temp2 = _mm_unpacklo_epi16(linec, lined); in ih264_deblk_chroma_vert_bslt4_ssse3() 475 temp3 = _mm_unpacklo_epi16(linee, linef); in ih264_deblk_chroma_vert_bslt4_ssse3() 476 temp4 = _mm_unpacklo_epi16(lineg, lineh); in ih264_deblk_chroma_vert_bslt4_ssse3() [all …]
|
D | ih264_deblk_luma_ssse3.c | 127 line1 = _mm_unpacklo_epi16(temp1, temp2); in ih264_deblk_luma_vert_bs4_ssse3() 129 line3 = _mm_unpacklo_epi16(temp3, temp4); in ih264_deblk_luma_vert_bs4_ssse3() 151 line1 = _mm_unpacklo_epi16(temp1, temp2); in ih264_deblk_luma_vert_bs4_ssse3() 153 line3 = _mm_unpacklo_epi16(temp3, temp4); in ih264_deblk_luma_vert_bs4_ssse3() 428 p3_8x16 = _mm_unpacklo_epi16(temp1, temp2); in ih264_deblk_luma_vert_bs4_ssse3() 430 q2_8x16 = _mm_unpacklo_epi16(temp3, temp4); in ih264_deblk_luma_vert_bs4_ssse3() 456 p3_8x16 = _mm_unpacklo_epi16(temp1, temp2); in ih264_deblk_luma_vert_bs4_ssse3() 458 q2_8x16 = _mm_unpacklo_epi16(temp3, temp4); in ih264_deblk_luma_vert_bs4_ssse3() 881 int1 = _mm_unpacklo_epi16(linea, lineb); in ih264_deblk_luma_vert_bslt4_ssse3() 884 int2 = _mm_unpacklo_epi16(linec, lined); in ih264_deblk_luma_vert_bslt4_ssse3() [all …]
|
D | ih264_inter_pred_filters_ssse3.c | 894 src_r0_8x16b = _mm_unpacklo_epi16(src_r0_8x16b, src_r1_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 895 src_t1_8x16b = _mm_unpacklo_epi16(src_r2_8x16b, src_r3_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 896 src_t2_8x16b = _mm_unpacklo_epi16(src_r4_8x16b, src_r5_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 908 src_r1_8x16b = _mm_unpacklo_epi16(src_r1_8x16b, src_r2_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 909 src_t1_8x16b = _mm_unpacklo_epi16(src_r3_8x16b, src_r4_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 910 src_t2_8x16b = _mm_unpacklo_epi16(src_r5_8x16b, src_r6_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 1087 src_r0r1_8x16b = _mm_unpacklo_epi16(src_r0_8x16b, src_r1_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 1088 src_r2r3_8x16b = _mm_unpacklo_epi16(src_r2_8x16b, src_r3_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 1089 src_r4r5_8x16b = _mm_unpacklo_epi16(src_r4_8x16b, src_r5_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 1118 src_r0r1_8x16b = _mm_unpacklo_epi16(src_r1_8x16b, src_r2_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() [all …]
|
D | ih264_iquant_itrans_recon_sse42.c | 139 …temp4 = _mm_unpacklo_epi16(temp0, zero_8x16b); // b00*q00 0 b01*q01 0 b02*q02 0 b03*q03 0 -- 16 bi… in ih264_iquant_itrans_recon_4x4_sse42() 141 …temp6 = _mm_unpacklo_epi16(temp1, zero_8x16b); // b00*q00 0 b01*q01 0 b02*q02 0 b03*q03 0 -- 16 bi… in ih264_iquant_itrans_recon_4x4_sse42() 144 src_r0 = _mm_unpacklo_epi16(src_r0_r1, zero_8x16b); // a00 0 a01 0 a02 0 a03 0 -- 16 bit long in ih264_iquant_itrans_recon_4x4_sse42() 146 src_r2 = _mm_unpacklo_epi16(src_r2_r3, zero_8x16b); // a20 0 a21 0 a22 0 a23 0 -- 16 bit long in ih264_iquant_itrans_recon_4x4_sse42() 390 …temp4 = _mm_unpacklo_epi16(temp0, zero_8x16b); // b00*q00 0 b01*q01 0 b02*q02 0 b03*q03 0 -- 16 bi… in ih264_iquant_itrans_recon_chroma_4x4_sse42() 392 …temp6 = _mm_unpacklo_epi16(temp1, zero_8x16b); // b00*q00 0 b01*q01 0 b02*q02 0 b03*q03 0 -- 16 bi… in ih264_iquant_itrans_recon_chroma_4x4_sse42() 395 src_r0 = _mm_unpacklo_epi16(src_r0_r1, zero_8x16b); // a00 0 a01 0 a02 0 a03 0 -- 16 bit long in ih264_iquant_itrans_recon_chroma_4x4_sse42() 397 src_r2 = _mm_unpacklo_epi16(src_r2_r3, zero_8x16b); // a20 0 a21 0 a22 0 a23 0 -- 16 bit long in ih264_iquant_itrans_recon_chroma_4x4_sse42()
|
D | ih264_resi_trans_quant_sse42.c | 165 temp0 = _mm_unpacklo_epi16(src_r0, src_r1); //a0 b0 a1 b1 a2 b2 a3 b3 in ih264_resi_trans_quant_4x4_sse42() 166 temp2 = _mm_unpacklo_epi16(src_r2, src_r3); //c0 d0 c1 d1 c2 d2 c3 d3 in ih264_resi_trans_quant_4x4_sse42() 203 temp0 = _mm_unpacklo_epi16(src_r0, src_r1); //a0 a1 b0 b1 c0 c1 d0 d1 in ih264_resi_trans_quant_4x4_sse42() 204 temp2 = _mm_unpacklo_epi16(src_r2, src_r3); //a2 a3 b2 b3 c2 c3 d2 d3 in ih264_resi_trans_quant_4x4_sse42() 448 temp0 = _mm_unpacklo_epi16(src_r0, src_r1); //a0 b0 a1 b1 a2 b2 a3 b3 in ih264_resi_trans_quant_chroma_4x4_sse42() 449 temp2 = _mm_unpacklo_epi16(src_r2, src_r3); //c0 d0 c1 d1 c2 d2 c3 d3 in ih264_resi_trans_quant_chroma_4x4_sse42() 486 temp0 = _mm_unpacklo_epi16(src_r0, src_r1); //a0 a1 b0 b1 c0 c1 d0 d1 in ih264_resi_trans_quant_chroma_4x4_sse42() 487 temp2 = _mm_unpacklo_epi16(src_r2, src_r3); //a2 a3 b2 b3 c2 c3 d2 d3 in ih264_resi_trans_quant_chroma_4x4_sse42() 689 src_r0 = _mm_unpacklo_epi16(src_r0_r1, sign_reg); //a0 a1 a2 a3 in ih264_hadamard_quant_4x4_sse42() 692 src_r2 = _mm_unpacklo_epi16(src_r2_r3, sign_reg); //c0 c1 c2 c3 in ih264_hadamard_quant_4x4_sse42() [all …]
|
/external/libvpx/libvpx/vpx_dsp/x86/ |
D | transpose_sse2.h | 32 return _mm_unpacklo_epi16(a0, a1); in transpose_8bit_4x4() 61 const __m128i b0 = _mm_unpacklo_epi16(a0, a1); in transpose_8bit_8x8() 63 const __m128i b2 = _mm_unpacklo_epi16(a2, a3); in transpose_8bit_8x8() 105 const __m128i a0 = _mm_unpacklo_epi16(in[0], in[1]); in transpose_16bit_4x4() 106 const __m128i a1 = _mm_unpacklo_epi16(in[2], in[3]); in transpose_16bit_4x4() 131 const __m128i a0 = _mm_unpacklo_epi16(in[0], in[1]); in transpose_16bit_4x8() 132 const __m128i a1 = _mm_unpacklo_epi16(in[2], in[3]); in transpose_16bit_4x8() 133 const __m128i a2 = _mm_unpacklo_epi16(in[4], in[5]); in transpose_16bit_4x8() 134 const __m128i a3 = _mm_unpacklo_epi16(in[6], in[7]); in transpose_16bit_4x8() 177 const __m128i a0 = _mm_unpacklo_epi16(in[0], in[1]); in transpose_16bit_8x8() [all …]
|
D | fwd_txfm_impl_sse2.h | 130 const __m128i r0 = _mm_unpacklo_epi16(in0, in1); in FDCT4x4_2D() 240 const __m128i y0 = _mm_unpacklo_epi16(x0, x1); in FDCT4x4_2D() 337 const __m128i t0 = _mm_unpacklo_epi16(r0, r1); in FDCT8x8_2D() 339 const __m128i t2 = _mm_unpacklo_epi16(r2, r3); in FDCT8x8_2D() 383 const __m128i d0 = _mm_unpacklo_epi16(q6, q5); in FDCT8x8_2D() 423 const __m128i t0 = _mm_unpacklo_epi16(x0, x3); in FDCT8x8_2D() 425 const __m128i t2 = _mm_unpacklo_epi16(x1, x2); in FDCT8x8_2D() 477 const __m128i tr0_0 = _mm_unpacklo_epi16(res0, res1); in FDCT8x8_2D() 478 const __m128i tr0_1 = _mm_unpacklo_epi16(res2, res3); in FDCT8x8_2D() 481 const __m128i tr0_4 = _mm_unpacklo_epi16(res4, res5); in FDCT8x8_2D() [all …]
|
D | inv_txfm_sse2.c | 19 const __m128i tr0_0 = _mm_unpacklo_epi16(res[0], res[1]); in transpose_16bit_4() 22 res[0] = _mm_unpacklo_epi16(tr0_0, tr0_1); in transpose_16bit_4() 91 u[0] = _mm_unpacklo_epi16(in[0], in[1]); in idct4_sse2() 117 u[0] = _mm_unpacklo_epi16(in[0], in[1]); in iadst4_sse2() 119 u[2] = _mm_unpacklo_epi16(in7, kZero); in iadst4_sse2() 276 s0 = _mm_unpacklo_epi16(in0, in1); in iadst8_sse2() 278 s2 = _mm_unpacklo_epi16(in2, in3); in iadst8_sse2() 280 s4 = _mm_unpacklo_epi16(in4, in5); in iadst8_sse2() 282 s6 = _mm_unpacklo_epi16(in6, in7); in iadst8_sse2() 370 u0 = _mm_unpacklo_epi16(in[4], in[5]); in iadst8_sse2() [all …]
|
D | fwd_dct32x32_impl_sse2.h | 395 const __m128i s2_20_0 = _mm_unpacklo_epi16(step1[27], step1[20]); in FDCT32x32_2D() 397 const __m128i s2_21_0 = _mm_unpacklo_epi16(step1[26], step1[21]); in FDCT32x32_2D() 399 const __m128i s2_22_0 = _mm_unpacklo_epi16(step1[25], step1[22]); in FDCT32x32_2D() 401 const __m128i s2_23_0 = _mm_unpacklo_epi16(step1[24], step1[23]); in FDCT32x32_2D() 652 const __m128i s3_10_0 = _mm_unpacklo_epi16(step2[13], step2[10]); in FDCT32x32_2D() 654 const __m128i s3_11_0 = _mm_unpacklo_epi16(step2[12], step2[11]); in FDCT32x32_2D() 760 const __m128i s1_05_0 = _mm_unpacklo_epi16(step3[6], step3[5]); in FDCT32x32_2D() 790 const __m128i s1_18_0 = _mm_unpacklo_epi16(step3[18], step3[29]); in FDCT32x32_2D() 792 const __m128i s1_19_0 = _mm_unpacklo_epi16(step3[19], step3[28]); in FDCT32x32_2D() 794 const __m128i s1_20_0 = _mm_unpacklo_epi16(step3[20], step3[27]); in FDCT32x32_2D() [all …]
|
D | inv_txfm_sse2.h | 35 const __m128i tr0_1 = _mm_unpacklo_epi16(in[1], in[0]); in idct8x8_12_transpose_16bit_4x8() 36 const __m128i tr0_2 = _mm_unpacklo_epi16(in[2], in[3]); in idct8x8_12_transpose_16bit_4x8() 86 const __m128i lo = _mm_unpacklo_epi16(in0, in1); in butterfly() 94 const __m128i lo = _mm_unpacklo_epi16(in, _mm_setzero_si128()); in butterfly_cospi16() 311 const __m128i lo_0 = _mm_unpacklo_epi16(io[0], zero); in idct8x8_12_add_kernel_sse2() 312 const __m128i lo_2 = _mm_unpacklo_epi16(io[1], zero); in idct8x8_12_add_kernel_sse2() 323 const __m128i lo_65 = _mm_unpacklo_epi16(step2[6], step2[5]); in idct8x8_12_add_kernel_sse2() 456 const __m128i lo_2_14 = _mm_unpacklo_epi16(output[1], zero); in idct16x16_10_pass1() 468 const __m128i lo_0_8 = _mm_unpacklo_epi16(output[0], zero); in idct16x16_10_pass1() 469 const __m128i lo_9_14 = _mm_unpacklo_epi16(step2[8], step1[14]); in idct16x16_10_pass1() [all …]
|
/external/libhevc/common/x86/ |
D | ihevc_itrans_recon_ssse3_intr.c | 172 m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_0, m_ge_zero16b_flag_row0); in ihevc_itrans_recon_4x4_ttype1_ssse3() 173 m_temp_reg_1 = _mm_unpacklo_epi16(m_temp_reg_1, m_ge_zero16b_flag_row1); in ihevc_itrans_recon_4x4_ttype1_ssse3() 174 m_temp_reg_2 = _mm_unpacklo_epi16(m_temp_reg_2, m_ge_zero16b_flag_row2); in ihevc_itrans_recon_4x4_ttype1_ssse3() 175 m_temp_reg_3 = _mm_unpacklo_epi16(m_temp_reg_3, m_ge_zero16b_flag_row3); in ihevc_itrans_recon_4x4_ttype1_ssse3() 295 m_temp_reg_24 = _mm_unpacklo_epi16(m_temp_reg_20, m_temp_reg_22); in ihevc_itrans_recon_4x4_ttype1_ssse3() 296 m_temp_reg_25 = _mm_unpacklo_epi16(m_temp_reg_21, m_temp_reg_23); in ihevc_itrans_recon_4x4_ttype1_ssse3() 317 m_temp_reg_20 = _mm_unpacklo_epi16(m_temp_reg_30, m_ge_zero16b_flag_row0); in ihevc_itrans_recon_4x4_ttype1_ssse3() 318 m_temp_reg_21 = _mm_unpacklo_epi16(m_temp_reg_31, m_ge_zero16b_flag_row1); in ihevc_itrans_recon_4x4_ttype1_ssse3() 433 m_temp_reg_24 = _mm_unpacklo_epi16(m_temp_reg_20, m_temp_reg_22); in ihevc_itrans_recon_4x4_ttype1_ssse3() 434 m_temp_reg_25 = _mm_unpacklo_epi16(m_temp_reg_21, m_temp_reg_23); in ihevc_itrans_recon_4x4_ttype1_ssse3() [all …]
|
D | ihevc_itrans_recon_sse42_intr.c | 246 m_temp_reg_24 = _mm_unpacklo_epi16(m_temp_reg_20, m_temp_reg_22); in ihevc_itrans_recon_4x4_ttype1_sse42() 247 m_temp_reg_25 = _mm_unpacklo_epi16(m_temp_reg_21, m_temp_reg_23); in ihevc_itrans_recon_4x4_ttype1_sse42() 337 m_temp_reg_24 = _mm_unpacklo_epi16(m_temp_reg_20, m_temp_reg_22); in ihevc_itrans_recon_4x4_ttype1_sse42() 338 m_temp_reg_25 = _mm_unpacklo_epi16(m_temp_reg_21, m_temp_reg_23); in ihevc_itrans_recon_4x4_ttype1_sse42() 572 m_temp_reg_24 = _mm_unpacklo_epi16(m_temp_reg_20, m_temp_reg_22); in ihevc_itrans_recon_4x4_sse42() 573 m_temp_reg_25 = _mm_unpacklo_epi16(m_temp_reg_21, m_temp_reg_23); in ihevc_itrans_recon_4x4_sse42() 664 m_temp_reg_24 = _mm_unpacklo_epi16(m_temp_reg_20, m_temp_reg_22); in ihevc_itrans_recon_4x4_sse42() 665 m_temp_reg_25 = _mm_unpacklo_epi16(m_temp_reg_21, m_temp_reg_23); in ihevc_itrans_recon_4x4_sse42() 885 m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_70, m_temp_reg_74); in ihevc_itrans_recon_8x8_sse42() 903 m_temp_reg_4 = _mm_unpacklo_epi16(m_temp_reg_72, m_temp_reg_76); in ihevc_itrans_recon_8x8_sse42() [all …]
|
D | ihevc_weighted_pred_ssse3_intr.c | 150 lvl_shift_4x32b = _mm_unpacklo_epi16(res_temp0_4x32b, res_temp1_4x32b); in ihevc_weighted_pred_uni_ssse3() 191 res_temp0_4x32b = _mm_unpacklo_epi16(res_temp0_4x32b, src_temp0_8x16b); in ihevc_weighted_pred_uni_ssse3() 192 res_temp1_4x32b = _mm_unpacklo_epi16(res_temp1_4x32b, src_temp1_8x16b); in ihevc_weighted_pred_uni_ssse3() 193 res_temp2_4x32b = _mm_unpacklo_epi16(res_temp2_4x32b, src_temp2_8x16b); in ihevc_weighted_pred_uni_ssse3() 194 res_temp3_4x32b = _mm_unpacklo_epi16(res_temp3_4x32b, src_temp3_8x16b); in ihevc_weighted_pred_uni_ssse3() 290 res_temp0_4x32b = _mm_unpacklo_epi16(res_temp0_4x32b, src_temp0_8x16b); in ihevc_weighted_pred_uni_ssse3() 291 res_temp1_4x32b = _mm_unpacklo_epi16(res_temp1_4x32b, src_temp1_8x16b); in ihevc_weighted_pred_uni_ssse3() 440 lvl_shift_4x32b = _mm_unpacklo_epi16(res_temp0_4x32b, res_temp1_4x32b); in ihevc_weighted_pred_chroma_uni_ssse3() 483 res_temp0_4x32b = _mm_unpacklo_epi16(res_temp0_4x32b, src_temp0_8x16b); in ihevc_weighted_pred_chroma_uni_ssse3() 484 res_temp1_4x32b = _mm_unpacklo_epi16(res_temp1_4x32b, src_temp1_8x16b); in ihevc_weighted_pred_chroma_uni_ssse3() [all …]
|
D | ihevc_itrans_recon_16x16_ssse3_intr.c | 241 m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_70, m_temp_reg_77); //row 0 in ihevc_itrans_recon_16x16_ssse3() 259 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_71, m_temp_reg_73); in ihevc_itrans_recon_16x16_ssse3() 409 …m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_72, m_temp_reg_76); //row 4 and row 12 interleaved LS… in ihevc_itrans_recon_16x16_ssse3() 426 m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_70, m_temp_reg_77); //row 0 in ihevc_itrans_recon_16x16_ssse3() 443 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_71, m_temp_reg_73); in ihevc_itrans_recon_16x16_ssse3() 605 …m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_72, m_temp_reg_76); //row 4 and row 12 interleaved LS… in ihevc_itrans_recon_16x16_ssse3() 623 …m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_70, m_temp_reg_74); //row 0 and row 8 interleaved LSB… in ihevc_itrans_recon_16x16_ssse3() 638 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_71, m_temp_reg_73); in ihevc_itrans_recon_16x16_ssse3() 640 m_temp_reg_12 = _mm_unpacklo_epi16(m_temp_reg_75, m_temp_reg_77); in ihevc_itrans_recon_16x16_ssse3() 859 … m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_70, m_temp_reg_71); //row 1 and row 3 L8B in ihevc_itrans_recon_16x16_ssse3() [all …]
|
D | ihevc_16x16_itrans_recon_sse42_intr.c | 235 m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_70, m_temp_reg_77); //row 0 in ihevc_itrans_recon_16x16_sse42() 253 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_71, m_temp_reg_73); in ihevc_itrans_recon_16x16_sse42() 403 …m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_72, m_temp_reg_76); //row 4 and row 12 interleaved LS… in ihevc_itrans_recon_16x16_sse42() 420 m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_70, m_temp_reg_77); //row 0 in ihevc_itrans_recon_16x16_sse42() 439 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_71, m_temp_reg_73); in ihevc_itrans_recon_16x16_sse42() 601 …m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_72, m_temp_reg_76); //row 4 and row 12 interleaved LS… in ihevc_itrans_recon_16x16_sse42() 619 …m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_70, m_temp_reg_74); //row 0 and row 8 interleaved LSB… in ihevc_itrans_recon_16x16_sse42() 634 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_71, m_temp_reg_73); in ihevc_itrans_recon_16x16_sse42() 636 m_temp_reg_12 = _mm_unpacklo_epi16(m_temp_reg_75, m_temp_reg_77); in ihevc_itrans_recon_16x16_sse42() 855 … m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_70, m_temp_reg_71); //row 1 and row 3 L8B in ihevc_itrans_recon_16x16_sse42() [all …]
|
D | ihevc_itrans_recon_32x32_ssse3_intr.c | 302 m_temp_reg_1 = _mm_unpacklo_epi16(m_temp_reg_70, all_zero_reg); in ihevc_itrans_recon_32x32_ssse3() 325 m_temp_reg_1 = _mm_unpacklo_epi16(m_temp_reg_70, all_zero_reg); in ihevc_itrans_recon_32x32_ssse3() 362 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_71, all_zero_reg); in ihevc_itrans_recon_32x32_ssse3() 371 m_temp_reg_14 = _mm_unpacklo_epi16(m_temp_reg_71, all_zero_reg); in ihevc_itrans_recon_32x32_ssse3() 615 m_temp_reg_1 = _mm_unpacklo_epi16(m_temp_reg_70, all_zero_reg); in ihevc_itrans_recon_32x32_ssse3() 640 m_temp_reg_1 = _mm_unpacklo_epi16(m_temp_reg_70, all_zero_reg); in ihevc_itrans_recon_32x32_ssse3() 670 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_72, all_zero_reg); in ihevc_itrans_recon_32x32_ssse3() 674 m_temp_reg_14 = _mm_unpacklo_epi16(m_temp_reg_72, all_zero_reg); in ihevc_itrans_recon_32x32_ssse3() 795 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_71, m_temp_reg_73); in ihevc_itrans_recon_32x32_ssse3() 823 m_temp_reg_14 = _mm_unpacklo_epi16(m_temp_reg_71, m_temp_reg_73); in ihevc_itrans_recon_32x32_ssse3() [all …]
|
D | ihevc_32x32_itrans_recon_sse42_intr.c | 293 m_temp_reg_1 = _mm_unpacklo_epi16(m_temp_reg_70, all_zero_reg); in ihevc_itrans_recon_32x32_sse42() 316 m_temp_reg_1 = _mm_unpacklo_epi16(m_temp_reg_70, all_zero_reg); in ihevc_itrans_recon_32x32_sse42() 352 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_71, all_zero_reg); in ihevc_itrans_recon_32x32_sse42() 360 m_temp_reg_14 = _mm_unpacklo_epi16(m_temp_reg_71, all_zero_reg); in ihevc_itrans_recon_32x32_sse42() 604 m_temp_reg_1 = _mm_unpacklo_epi16(m_temp_reg_70, all_zero_reg); in ihevc_itrans_recon_32x32_sse42() 629 m_temp_reg_1 = _mm_unpacklo_epi16(m_temp_reg_70, all_zero_reg); in ihevc_itrans_recon_32x32_sse42() 659 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_72, all_zero_reg); in ihevc_itrans_recon_32x32_sse42() 663 m_temp_reg_14 = _mm_unpacklo_epi16(m_temp_reg_72, all_zero_reg); in ihevc_itrans_recon_32x32_sse42() 784 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_71, m_temp_reg_73); in ihevc_itrans_recon_32x32_sse42() 813 m_temp_reg_14 = _mm_unpacklo_epi16(m_temp_reg_71, m_temp_reg_73); in ihevc_itrans_recon_32x32_sse42() [all …]
|
/external/libmpeg2/common/x86/ |
D | impeg2_idct_recon_sse42_intr.c | 223 m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_70, m_temp_reg_74); in impeg2_idct_recon_sse42() 241 m_temp_reg_4 = _mm_unpacklo_epi16(m_temp_reg_72, m_temp_reg_76); in impeg2_idct_recon_sse42() 277 m_temp_reg_60 = _mm_unpacklo_epi16(m_temp_reg_71, m_temp_reg_73); in impeg2_idct_recon_sse42() 399 m_temp_reg_10 = _mm_unpacklo_epi16(m_temp_reg_50, m_temp_reg_51); in impeg2_idct_recon_sse42() 400 m_temp_reg_11 = _mm_unpacklo_epi16(m_temp_reg_52, m_temp_reg_53); in impeg2_idct_recon_sse42() 404 m_temp_reg_12 = _mm_unpacklo_epi16(m_temp_reg_54, m_temp_reg_55); in impeg2_idct_recon_sse42() 405 m_temp_reg_13 = _mm_unpacklo_epi16(m_temp_reg_56, m_temp_reg_57); in impeg2_idct_recon_sse42() 431 m_temp_reg_0 = _mm_unpacklo_epi16(m_temp_reg_70, m_temp_reg_74); in impeg2_idct_recon_sse42() 449 m_temp_reg_4 = _mm_unpacklo_epi16(m_temp_reg_72, m_temp_reg_76); in impeg2_idct_recon_sse42() 485 m_temp_reg_60 = _mm_unpacklo_epi16(m_temp_reg_71, m_temp_reg_73); in impeg2_idct_recon_sse42() [all …]
|
/external/libvpx/libvpx/vp9/encoder/x86/ |
D | vp9_dct_intrin_sse2.c | 59 const __m128i tr0_0 = _mm_unpacklo_epi16(res[0], res[1]); in transpose_4x4() 82 u[0] = _mm_unpacklo_epi16(in[0], in[1]); in fdct4_sse2() 83 u[1] = _mm_unpacklo_epi16(in[3], in[2]); in fdct4_sse2() 118 u[0] = _mm_unpacklo_epi16(in[0], in[1]); in fadst4_sse2() 119 u[1] = _mm_unpacklo_epi16(in[2], in[3]); in fadst4_sse2() 120 u[2] = _mm_unpacklo_epi16(in7, kZero); in fadst4_sse2() 121 u[3] = _mm_unpacklo_epi16(in[2], kZero); in fadst4_sse2() 122 u[4] = _mm_unpacklo_epi16(in[3], kZero); in fadst4_sse2() 264 const __m128i t0 = _mm_unpacklo_epi16(r0, r1); in vp9_fdct8x8_quant_sse2() 266 const __m128i t2 = _mm_unpacklo_epi16(r2, r3); in vp9_fdct8x8_quant_sse2() [all …]
|
D | vp9_dct_ssse3.c | 101 const __m128i t0 = _mm_unpacklo_epi16(r0, r1); in vp9_fdct8x8_quant_ssse3() 103 const __m128i t2 = _mm_unpacklo_epi16(r2, r3); in vp9_fdct8x8_quant_ssse3() 157 const __m128i t0 = _mm_unpacklo_epi16(x0, x3); in vp9_fdct8x8_quant_ssse3() 159 const __m128i t2 = _mm_unpacklo_epi16(x1, x2); in vp9_fdct8x8_quant_ssse3() 202 const __m128i tr0_0 = _mm_unpacklo_epi16(res0, res1); in vp9_fdct8x8_quant_ssse3() 203 const __m128i tr0_1 = _mm_unpacklo_epi16(res2, res3); in vp9_fdct8x8_quant_ssse3() 206 const __m128i tr0_4 = _mm_unpacklo_epi16(res4, res5); in vp9_fdct8x8_quant_ssse3() 207 const __m128i tr0_5 = _mm_unpacklo_epi16(res6, res7); in vp9_fdct8x8_quant_ssse3()
|
/external/tensorflow/tensorflow/core/kernels/ |
D | sparse_matmul_op.h | 196 return _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp)); 204 return _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp)); 213 return _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp)); in pexpand_bf16_l() 348 _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp))); 356 _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp))); 366 _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp))); 374 _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp))); 389 __m128i res_l = _mm_unpacklo_epi16(zero, low); in pexpand_bf16_l() 391 __m128i res_h = _mm_unpacklo_epi16(zero, high); in pexpand_bf16_l()
|
/external/skqp/src/opts/ |
D | SkNx_sse.h | 330 __m128i even = _mm_unpacklo_epi16(lo, hi), // r0 r2 g0 g2 b0 b2 a0 a2 in Load4() 332 __m128i rg = _mm_unpacklo_epi16(even, odd), // r0 r1 r2 r3 g0 g1 g2 g3 in Load4() 349 __m128i rrggbb01 = _mm_unpacklo_epi16(rgb0, rgb1); in Load3() 350 __m128i rrggbb23 = _mm_unpacklo_epi16(rgb2, rgb3); in Load3() 356 __m128i rg = _mm_unpacklo_epi16(r.fVec, g.fVec); in Store4() 357 __m128i ba = _mm_unpacklo_epi16(b.fVec, a.fVec); in Store4() 402 __m128i _02 = _mm_unpacklo_epi16(_01, _23), // r0 r2 g0 g2 b0 b2 a0 a2 in Load4() 404 _46 = _mm_unpacklo_epi16(_45, _67), in Load4() 407 __m128i rg0123 = _mm_unpacklo_epi16(_02, _13), // r0 r1 r2 r3 g0 g1 g2 g3 in Load4() 409 rg4567 = _mm_unpacklo_epi16(_46, _57), in Load4() [all …]
|
/external/skia/src/opts/ |
D | SkNx_sse.h | 337 __m128i even = _mm_unpacklo_epi16(lo, hi), // r0 r2 g0 g2 b0 b2 a0 a2 in Load4() 339 __m128i rg = _mm_unpacklo_epi16(even, odd), // r0 r1 r2 r3 g0 g1 g2 g3 in Load4() 356 __m128i rrggbb01 = _mm_unpacklo_epi16(rgb0, rgb1); in Load3() 357 __m128i rrggbb23 = _mm_unpacklo_epi16(rgb2, rgb3); in Load3() 363 __m128i rg = _mm_unpacklo_epi16(r.fVec, g.fVec); in Store4() 364 __m128i ba = _mm_unpacklo_epi16(b.fVec, a.fVec); in Store4() 409 __m128i _02 = _mm_unpacklo_epi16(_01, _23), // r0 r2 g0 g2 b0 b2 a0 a2 in Load4() 411 _46 = _mm_unpacklo_epi16(_45, _67), in Load4() 414 __m128i rg0123 = _mm_unpacklo_epi16(_02, _13), // r0 r1 r2 r3 g0 g1 g2 g3 in Load4() 416 rg4567 = _mm_unpacklo_epi16(_46, _57), in Load4() [all …]
|
/external/libavc/encoder/x86/ |
D | ih264e_half_pel_ssse3.c | 403 src_r0r1_8x16b = _mm_unpacklo_epi16(src_r0_8x16b, src_r1_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 404 src_r2r3_8x16b = _mm_unpacklo_epi16(src_r2_8x16b, src_r3_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 405 src_r4r5_8x16b = _mm_unpacklo_epi16(src_r4_8x16b, src_r5_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 441 src_r0r1_8x16b = _mm_unpacklo_epi16(src_r0_8x16b, src_r1_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 442 src_r2r3_8x16b = _mm_unpacklo_epi16(src_r2_8x16b, src_r3_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 443 src_r4r5_8x16b = _mm_unpacklo_epi16(src_r4_8x16b, src_r5_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3()
|