/external/libhevc/common/x86/ |
D | ihevc_32x32_itrans_recon_sse42_intr.c | 295 m_temp_reg_14 = _mm_madd_epi16(m_temp_reg_1, m_coeff3); in ihevc_itrans_recon_32x32_sse42() 318 m_temp_reg_14 = _mm_madd_epi16(m_temp_reg_1, m_coeff3); in ihevc_itrans_recon_32x32_sse42() 358 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); in ihevc_itrans_recon_32x32_sse42() 374 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_14, m_coeff1); in ihevc_itrans_recon_32x32_sse42() 387 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff2); in ihevc_itrans_recon_32x32_sse42() 401 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_14, m_coeff2); in ihevc_itrans_recon_32x32_sse42() 415 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff3); in ihevc_itrans_recon_32x32_sse42() 429 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_14, m_coeff3); in ihevc_itrans_recon_32x32_sse42() 446 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff4); in ihevc_itrans_recon_32x32_sse42() 460 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_14, m_coeff4); in ihevc_itrans_recon_32x32_sse42() [all …]
|
D | ihevc_itrans_recon_32x32_ssse3_intr.c | 304 m_temp_reg_14 = _mm_madd_epi16(m_temp_reg_1, m_coeff3); in ihevc_itrans_recon_32x32_ssse3() 327 m_temp_reg_14 = _mm_madd_epi16(m_temp_reg_1, m_coeff3); in ihevc_itrans_recon_32x32_ssse3() 368 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); in ihevc_itrans_recon_32x32_ssse3() 385 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_14, m_coeff1); in ihevc_itrans_recon_32x32_ssse3() 398 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff2); in ihevc_itrans_recon_32x32_ssse3() 412 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_14, m_coeff2); in ihevc_itrans_recon_32x32_ssse3() 426 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff3); in ihevc_itrans_recon_32x32_ssse3() 440 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_14, m_coeff3); in ihevc_itrans_recon_32x32_ssse3() 457 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff4); in ihevc_itrans_recon_32x32_ssse3() 471 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_14, m_coeff4); in ihevc_itrans_recon_32x32_ssse3() [all …]
|
D | ihevc_itrans_recon_16x16_ssse3_intr.c | 262 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); in ihevc_itrans_recon_16x16_ssse3() 281 m_temp_reg_31 = _mm_madd_epi16(m_temp_reg_11, m_coeff1); in ihevc_itrans_recon_16x16_ssse3() 300 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff3); in ihevc_itrans_recon_16x16_ssse3() 317 m_temp_reg_31 = _mm_madd_epi16(m_temp_reg_11, m_coeff3); in ihevc_itrans_recon_16x16_ssse3() 337 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); in ihevc_itrans_recon_16x16_ssse3() 353 m_temp_reg_31 = _mm_madd_epi16(m_temp_reg_11, m_coeff1); in ihevc_itrans_recon_16x16_ssse3() 371 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff3); in ihevc_itrans_recon_16x16_ssse3() 386 m_temp_reg_31 = _mm_madd_epi16(m_temp_reg_11, m_coeff3); in ihevc_itrans_recon_16x16_ssse3() 412 m_temp_reg_20 = _mm_madd_epi16(m_temp_reg_0, m_coeff1); in ihevc_itrans_recon_16x16_ssse3() 413 m_temp_reg_22 = _mm_madd_epi16(m_temp_reg_0, m_coeff2); in ihevc_itrans_recon_16x16_ssse3() [all …]
|
D | ihevc_16x16_itrans_recon_sse42_intr.c | 256 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); in ihevc_itrans_recon_16x16_sse42() 275 m_temp_reg_31 = _mm_madd_epi16(m_temp_reg_11, m_coeff1); in ihevc_itrans_recon_16x16_sse42() 294 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff3); in ihevc_itrans_recon_16x16_sse42() 311 m_temp_reg_31 = _mm_madd_epi16(m_temp_reg_11, m_coeff3); in ihevc_itrans_recon_16x16_sse42() 331 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); in ihevc_itrans_recon_16x16_sse42() 347 m_temp_reg_31 = _mm_madd_epi16(m_temp_reg_11, m_coeff1); in ihevc_itrans_recon_16x16_sse42() 365 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff3); in ihevc_itrans_recon_16x16_sse42() 380 m_temp_reg_31 = _mm_madd_epi16(m_temp_reg_11, m_coeff3); in ihevc_itrans_recon_16x16_sse42() 406 m_temp_reg_20 = _mm_madd_epi16(m_temp_reg_0, m_coeff1); in ihevc_itrans_recon_16x16_sse42() 407 m_temp_reg_22 = _mm_madd_epi16(m_temp_reg_0, m_coeff2); in ihevc_itrans_recon_16x16_sse42() [all …]
|
D | ihevc_itrans_recon_sse42_intr.c | 887 m_temp_reg_10 = _mm_madd_epi16(m_temp_reg_0, m_coeff1); in ihevc_itrans_recon_8x8_sse42() 888 m_temp_reg_12 = _mm_madd_epi16(m_temp_reg_0, m_coeff2); in ihevc_itrans_recon_8x8_sse42() 905 m_temp_reg_16 = _mm_madd_epi16(m_temp_reg_4, m_coeff1); in ihevc_itrans_recon_8x8_sse42() 906 m_temp_reg_14 = _mm_madd_epi16(m_temp_reg_4, m_coeff2); in ihevc_itrans_recon_8x8_sse42() 941 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_60, m_coeff1); in ihevc_itrans_recon_8x8_sse42() 967 m_temp_reg_32 = _mm_madd_epi16(m_temp_reg_60, m_coeff3); in ihevc_itrans_recon_8x8_sse42() 996 m_temp_reg_34 = _mm_madd_epi16(m_temp_reg_60, m_coeff1); in ihevc_itrans_recon_8x8_sse42() 1026 m_temp_reg_36 = _mm_madd_epi16(m_temp_reg_60, m_coeff3); in ihevc_itrans_recon_8x8_sse42() 1095 m_temp_reg_10 = _mm_madd_epi16(m_temp_reg_0, m_coeff1); in ihevc_itrans_recon_8x8_sse42() 1096 m_temp_reg_12 = _mm_madd_epi16(m_temp_reg_0, m_coeff2); in ihevc_itrans_recon_8x8_sse42() [all …]
|
D | ihevc_itrans_recon_ssse3_intr.c | 1066 m_temp_reg_10 = _mm_madd_epi16(m_temp_reg_0, m_coeff1); in ihevc_itrans_recon_8x8_ssse3() 1067 m_temp_reg_12 = _mm_madd_epi16(m_temp_reg_0, m_coeff2); in ihevc_itrans_recon_8x8_ssse3() 1084 m_temp_reg_16 = _mm_madd_epi16(m_temp_reg_4, m_coeff1); in ihevc_itrans_recon_8x8_ssse3() 1085 m_temp_reg_14 = _mm_madd_epi16(m_temp_reg_4, m_coeff2); in ihevc_itrans_recon_8x8_ssse3() 1120 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_60, m_coeff1); in ihevc_itrans_recon_8x8_ssse3() 1146 m_temp_reg_32 = _mm_madd_epi16(m_temp_reg_60, m_coeff3); in ihevc_itrans_recon_8x8_ssse3() 1175 m_temp_reg_34 = _mm_madd_epi16(m_temp_reg_60, m_coeff1); in ihevc_itrans_recon_8x8_ssse3() 1205 m_temp_reg_36 = _mm_madd_epi16(m_temp_reg_60, m_coeff3); in ihevc_itrans_recon_8x8_ssse3() 1286 m_temp_reg_10 = _mm_madd_epi16(m_temp_reg_0, m_coeff1); in ihevc_itrans_recon_8x8_ssse3() 1287 m_temp_reg_12 = _mm_madd_epi16(m_temp_reg_0, m_coeff2); in ihevc_itrans_recon_8x8_ssse3() [all …]
|
D | ihevc_inter_pred_filters_ssse3_intr.c | 2686 s0_8x16b = _mm_madd_epi16(s3_0_16x8b, coeff0_1_8x16b); in ihevc_inter_pred_luma_vert_w16inp_ssse3() 2696 s1_8x16b = _mm_madd_epi16(s3_1_16x8b, coeff2_3_8x16b); in ihevc_inter_pred_luma_vert_w16inp_ssse3() 2706 s2_8x16b = _mm_madd_epi16(s3_2_16x8b, coeff4_5_8x16b); in ihevc_inter_pred_luma_vert_w16inp_ssse3() 2716 s3_8x16b = _mm_madd_epi16(s3_3_16x8b, coeff6_7_8x16b); in ihevc_inter_pred_luma_vert_w16inp_ssse3() 2747 s20_8x16b = _mm_madd_epi16(s3_1_16x8b, coeff0_1_8x16b); in ihevc_inter_pred_luma_vert_w16inp_ssse3() 2748 s21_8x16b = _mm_madd_epi16(s3_2_16x8b, coeff2_3_8x16b); in ihevc_inter_pred_luma_vert_w16inp_ssse3() 2749 s22_8x16b = _mm_madd_epi16(s3_3_16x8b, coeff4_5_8x16b); in ihevc_inter_pred_luma_vert_w16inp_ssse3() 2759 s23_8x16b = _mm_madd_epi16(s3_4_16x8b, coeff6_7_8x16b); in ihevc_inter_pred_luma_vert_w16inp_ssse3() 2793 s10_8x16b = _mm_madd_epi16(s4_0_16x8b, coeff0_1_8x16b); in ihevc_inter_pred_luma_vert_w16inp_ssse3() 2797 s11_8x16b = _mm_madd_epi16(s4_1_16x8b, coeff2_3_8x16b); in ihevc_inter_pred_luma_vert_w16inp_ssse3() [all …]
|
/external/libvpx/libvpx/vp9/encoder/x86/ |
D | vp9_dct_sse2.c | 87 u[0] = _mm_madd_epi16(v[0], k__cospi_p16_p16); // 0 in fdct4_sse2() 88 u[1] = _mm_madd_epi16(v[0], k__cospi_p16_m16); // 2 in fdct4_sse2() 89 u[2] = _mm_madd_epi16(v[1], k__cospi_p08_p24); // 1 in fdct4_sse2() 90 u[3] = _mm_madd_epi16(v[1], k__cospi_p24_m08); // 3 in fdct4_sse2() 123 v[0] = _mm_madd_epi16(u[0], k__sinpi_p01_p02); // s0 + s2 in fadst4_sse2() 124 v[1] = _mm_madd_epi16(u[1], k__sinpi_p03_p04); // s4 + s5 in fadst4_sse2() 125 v[2] = _mm_madd_epi16(u[2], k__sinpi_p03_p03); // x1 in fadst4_sse2() 126 v[3] = _mm_madd_epi16(u[0], k__sinpi_p04_m01); // s1 - s3 in fadst4_sse2() 127 v[4] = _mm_madd_epi16(u[1], k__sinpi_m03_p02); // -s4 + s6 in fadst4_sse2() 128 v[5] = _mm_madd_epi16(u[3], k__sinpi_p03_p03); // s4 in fadst4_sse2() [all …]
|
D | vp9_dct_ssse3.c | 114 const __m128i u0 = _mm_madd_epi16(t0, k__cospi_p16_p16); in vp9_fdct8x8_quant_ssse3() 115 const __m128i u1 = _mm_madd_epi16(t1, k__cospi_p16_p16); in vp9_fdct8x8_quant_ssse3() 116 const __m128i u2 = _mm_madd_epi16(t0, k__cospi_p16_m16); in vp9_fdct8x8_quant_ssse3() 117 const __m128i u3 = _mm_madd_epi16(t1, k__cospi_p16_m16); in vp9_fdct8x8_quant_ssse3() 119 const __m128i u4 = _mm_madd_epi16(t2, k__cospi_p24_p08); in vp9_fdct8x8_quant_ssse3() 120 const __m128i u5 = _mm_madd_epi16(t3, k__cospi_p24_p08); in vp9_fdct8x8_quant_ssse3() 121 const __m128i u6 = _mm_madd_epi16(t2, k__cospi_m08_p24); in vp9_fdct8x8_quant_ssse3() 122 const __m128i u7 = _mm_madd_epi16(t3, k__cospi_m08_p24); in vp9_fdct8x8_quant_ssse3() 169 const __m128i u0 = _mm_madd_epi16(t0, k__cospi_p28_p04); in vp9_fdct8x8_quant_ssse3() 170 const __m128i u1 = _mm_madd_epi16(t1, k__cospi_p28_p04); in vp9_fdct8x8_quant_ssse3() [all …]
|
D | vp9_highbd_block_error_intrin_sse2.c | 51 error_sse2 = _mm_madd_epi16(mm_diff, mm_diff); in vp9_highbd_block_error_sse2() 52 sqcoeff_sse2 = _mm_madd_epi16(mm_coeff, mm_coeff); in vp9_highbd_block_error_sse2()
|
/external/libmpeg2/common/x86/ |
D | impeg2_idct_recon_sse42_intr.c | 225 m_temp_reg_10 = _mm_madd_epi16(m_temp_reg_0, m_coeff1); in impeg2_idct_recon_sse42() 226 m_temp_reg_12 = _mm_madd_epi16(m_temp_reg_0, m_coeff2); in impeg2_idct_recon_sse42() 243 m_temp_reg_16 = _mm_madd_epi16(m_temp_reg_4, m_coeff1); in impeg2_idct_recon_sse42() 244 m_temp_reg_14 = _mm_madd_epi16(m_temp_reg_4, m_coeff2); in impeg2_idct_recon_sse42() 279 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_60, m_coeff1); in impeg2_idct_recon_sse42() 305 m_temp_reg_32 = _mm_madd_epi16(m_temp_reg_60, m_coeff3); in impeg2_idct_recon_sse42() 334 m_temp_reg_34 = _mm_madd_epi16(m_temp_reg_60, m_coeff1); in impeg2_idct_recon_sse42() 364 m_temp_reg_36 = _mm_madd_epi16(m_temp_reg_60, m_coeff3); in impeg2_idct_recon_sse42() 433 m_temp_reg_10 = _mm_madd_epi16(m_temp_reg_0, m_coeff1); in impeg2_idct_recon_sse42() 434 m_temp_reg_12 = _mm_madd_epi16(m_temp_reg_0, m_coeff2); in impeg2_idct_recon_sse42() [all …]
|
D | icv_variance_ssse3.c | 140 sqr_r0 = _mm_madd_epi16(ssrc_r0, ssrc_r0); in icv_variance_8x4_ssse3() 141 sqr_r1 = _mm_madd_epi16(ssrc_r1, ssrc_r1); in icv_variance_8x4_ssse3() 142 sqr_r2 = _mm_madd_epi16(ssrc_r2, ssrc_r2); in icv_variance_8x4_ssse3() 143 sqr_r3 = _mm_madd_epi16(ssrc_r3, ssrc_r3); in icv_variance_8x4_ssse3()
|
/external/libvpx/libvpx/vpx_dsp/x86/ |
D | inv_txfm_sse2.c | 50 input0 = _mm_madd_epi16(input0, cst); in vpx_idct4x4_16_add_sse2() 51 input1 = _mm_madd_epi16(input1, cst); in vpx_idct4x4_16_add_sse2() 52 input2 = _mm_madd_epi16(input2, cst); in vpx_idct4x4_16_add_sse2() 53 input3 = _mm_madd_epi16(input3, cst); in vpx_idct4x4_16_add_sse2() 89 input0 = _mm_madd_epi16(input0, cst); in vpx_idct4x4_16_add_sse2() 90 input1 = _mm_madd_epi16(input1, cst); in vpx_idct4x4_16_add_sse2() 91 input2 = _mm_madd_epi16(input2, cst); in vpx_idct4x4_16_add_sse2() 92 input3 = _mm_madd_epi16(input3, cst); in vpx_idct4x4_16_add_sse2() 191 v[0] = _mm_madd_epi16(u[0], k__cospi_p16_p16); in idct4_sse2() 192 v[1] = _mm_madd_epi16(u[0], k__cospi_p16_m16); in idct4_sse2() [all …]
|
D | fwd_dct32x32_impl_sse2.h | 409 const __m128i s2_20_2 = _mm_madd_epi16(s2_20_0, k__cospi_p16_m16); in FDCT32x32_2D() 410 const __m128i s2_20_3 = _mm_madd_epi16(s2_20_1, k__cospi_p16_m16); in FDCT32x32_2D() 411 const __m128i s2_21_2 = _mm_madd_epi16(s2_21_0, k__cospi_p16_m16); in FDCT32x32_2D() 412 const __m128i s2_21_3 = _mm_madd_epi16(s2_21_1, k__cospi_p16_m16); in FDCT32x32_2D() 413 const __m128i s2_22_2 = _mm_madd_epi16(s2_22_0, k__cospi_p16_m16); in FDCT32x32_2D() 414 const __m128i s2_22_3 = _mm_madd_epi16(s2_22_1, k__cospi_p16_m16); in FDCT32x32_2D() 415 const __m128i s2_23_2 = _mm_madd_epi16(s2_23_0, k__cospi_p16_m16); in FDCT32x32_2D() 416 const __m128i s2_23_3 = _mm_madd_epi16(s2_23_1, k__cospi_p16_m16); in FDCT32x32_2D() 417 const __m128i s2_24_2 = _mm_madd_epi16(s2_23_0, k__cospi_p16_p16); in FDCT32x32_2D() 418 const __m128i s2_24_3 = _mm_madd_epi16(s2_23_1, k__cospi_p16_p16); in FDCT32x32_2D() [all …]
|
D | fwd_txfm_impl_sse2.h | 158 const __m128i u0 = _mm_madd_epi16(t0, k__cospi_A); in FDCT4x4_2D() 159 const __m128i u2 = _mm_madd_epi16(t0, k__cospi_B); in FDCT4x4_2D() 160 const __m128i u1 = _mm_madd_epi16(t1, k__cospi_C); in FDCT4x4_2D() 161 const __m128i u3 = _mm_madd_epi16(t1, k__cospi_D); in FDCT4x4_2D() 214 const __m128i u0 = _mm_madd_epi16(t0, k__cospi_E); in FDCT4x4_2D() 215 const __m128i u1 = _mm_madd_epi16(t0, k__cospi_F); in FDCT4x4_2D() 216 const __m128i u2 = _mm_madd_epi16(t1, k__cospi_G); in FDCT4x4_2D() 217 const __m128i u3 = _mm_madd_epi16(t1, k__cospi_H); in FDCT4x4_2D() 350 const __m128i u0 = _mm_madd_epi16(t0, k__cospi_p16_p16); in FDCT8x8_2D() 351 const __m128i u1 = _mm_madd_epi16(t1, k__cospi_p16_p16); in FDCT8x8_2D() [all …]
|
D | variance_sse2.c | 28 vsum = _mm_add_epi32(vsum, _mm_madd_epi16(v, v)); in vpx_get_mb_ss_sse2() 60 vsum = _mm_add_epi32(_mm_madd_epi16(diff0, diff0), in get4x4var_sse2() 61 _mm_madd_epi16(diff1, diff1)); in get4x4var_sse2() 90 vsse = _mm_add_epi32(vsse, _mm_madd_epi16(diff0, diff0)); in vpx_get8x8var_sse2() 91 vsse = _mm_add_epi32(vsse, _mm_madd_epi16(diff1, diff1)); in vpx_get8x8var_sse2() 128 vsse = _mm_add_epi32(vsse, _mm_madd_epi16(diff0, diff0)); in vpx_get16x16var_sse2() 129 vsse = _mm_add_epi32(vsse, _mm_madd_epi16(diff1, diff1)); in vpx_get16x16var_sse2()
|
/external/libavc/encoder/x86/ |
D | ih264e_half_pel_ssse3.c | 407 res_t1_4x32b = _mm_madd_epi16(src_r0r1_8x16b, coeff0_1_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 408 res_t2_4x32b = _mm_madd_epi16(src_r2r3_8x16b, coeff2_3_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 409 res_t3_4x32b = _mm_madd_epi16(src_r4r5_8x16b, coeff4_5_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 420 res_t1_4x32b = _mm_madd_epi16(src_r0r1_8x16b, coeff0_1_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 421 res_t2_4x32b = _mm_madd_epi16(src_r2r3_8x16b, coeff2_3_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 422 res_t3_4x32b = _mm_madd_epi16(src_r4r5_8x16b, coeff4_5_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 445 res_t1_4x32b = _mm_madd_epi16(src_r0r1_8x16b, coeff0_1_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 446 res_t2_4x32b = _mm_madd_epi16(src_r2r3_8x16b, coeff2_3_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 447 res_t3_4x32b = _mm_madd_epi16(src_r4r5_8x16b, coeff4_5_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 458 res_t1_4x32b = _mm_madd_epi16(src_r0r1_8x16b, coeff0_1_8x16b); in ih264e_sixtap_filter_2dvh_vert_ssse3() [all …]
|
/external/libavc/common/x86/ |
D | ih264_inter_pred_filters_ssse3.c | 898 res_t1_4x32b = _mm_madd_epi16(src_r0_8x16b, coeff0_1_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 899 res_t2_4x32b = _mm_madd_epi16(src_t1_8x16b, coeff2_3_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 900 res_t3_4x32b = _mm_madd_epi16(src_t2_8x16b, coeff4_5_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 912 res_t1_4x32b = _mm_madd_epi16(src_r1_8x16b, coeff0_1_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 913 res_t2_4x32b = _mm_madd_epi16(src_t1_8x16b, coeff2_3_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 914 res_t3_4x32b = _mm_madd_epi16(src_t2_8x16b, coeff4_5_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 1091 res_t1_4x32b = _mm_madd_epi16(src_r0r1_8x16b, coeff0_1_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 1092 res_t2_4x32b = _mm_madd_epi16(src_r2r3_8x16b, coeff2_3_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 1093 res_t3_4x32b = _mm_madd_epi16(src_r4r5_8x16b, coeff4_5_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() 1104 res_t1_4x32b = _mm_madd_epi16(src_r0r1_8x16b, coeff0_1_8x16b); in ih264_inter_pred_luma_horz_hpel_vert_hpel_ssse3() [all …]
|
D | ih264_iquant_itrans_recon_ssse3.c | 150 …temp4 = _mm_madd_epi16(src_r0, temp4); //a00*b00*q00 a10*b10*q10 a20*b20*q20 a30*b30 q30 -- 32 bit… in ih264_iquant_itrans_recon_4x4_ssse3() 151 temp5 = _mm_madd_epi16(src_r1, temp5); in ih264_iquant_itrans_recon_4x4_ssse3() 152 temp6 = _mm_madd_epi16(src_r2, temp6); in ih264_iquant_itrans_recon_4x4_ssse3() 153 temp7 = _mm_madd_epi16(src_r3, temp7); in ih264_iquant_itrans_recon_4x4_ssse3() 421 …temp5 = _mm_madd_epi16(src_r0_1, scalemat_r0_1); // a00*b00*q0 a01*b01*q1 a02*b02*q2 a03*b03*q3 --… in ih264_iquant_itrans_recon_8x8_ssse3() 422 …temp7 = _mm_madd_epi16(src_r0_2, scalemat_r0_2); // a04*b04*q4 a05*b05*q5 a06*b06*q6 a07*b07*q7 --… in ih264_iquant_itrans_recon_8x8_ssse3() 443 …temp5 = _mm_madd_epi16(src_r0_1, scalemat_r0_1); // a00*b00*q0 a01*b01*q1 a02*b02*q2 a03*b03*q3 --… in ih264_iquant_itrans_recon_8x8_ssse3() 444 …temp7 = _mm_madd_epi16(src_r0_2, scalemat_r0_2); // a04*b04*q4 a05*b05*q5 a06*b06*q6 a07*b07*q7 --… in ih264_iquant_itrans_recon_8x8_ssse3() 464 …temp5 = _mm_madd_epi16(src_r0_1, scalemat_r0_1); // a00*b00*q0 a01*b01*q1 a02*b02*q2 a03*b03*q3 --… in ih264_iquant_itrans_recon_8x8_ssse3() 465 …temp7 = _mm_madd_epi16(src_r0_2, scalemat_r0_2); // a04*b04*q4 a05*b05*q5 a06*b06*q6 a07*b07*q7 --… in ih264_iquant_itrans_recon_8x8_ssse3() [all …]
|
D | ih264_ihadamard_scaling_ssse3.c | 180 src_r0 = _mm_madd_epi16(src_r0, mult_val); in ih264_ihadamard_scaling_4x4_ssse3() 181 src_r1 = _mm_madd_epi16(src_r1, mult_val); in ih264_ihadamard_scaling_4x4_ssse3() 182 src_r2 = _mm_madd_epi16(src_r2, mult_val); in ih264_ihadamard_scaling_4x4_ssse3() 183 src_r3 = _mm_madd_epi16(src_r3, mult_val); in ih264_ihadamard_scaling_4x4_ssse3()
|
D | ih264_iquant_itrans_recon_sse42.c | 149 …temp4 = _mm_madd_epi16(src_r0, temp4); //a00*b00*q00 a10*b10*q10 a20*b20*q20 a30*b30 q30 -- 32 bit… in ih264_iquant_itrans_recon_4x4_sse42() 150 temp5 = _mm_madd_epi16(src_r1, temp5); in ih264_iquant_itrans_recon_4x4_sse42() 151 temp6 = _mm_madd_epi16(src_r2, temp6); in ih264_iquant_itrans_recon_4x4_sse42() 152 temp7 = _mm_madd_epi16(src_r3, temp7); in ih264_iquant_itrans_recon_4x4_sse42() 400 …temp4 = _mm_madd_epi16(src_r0, temp4); //a00*b00*q00 a10*b10*q10 a20*b20*q20 a30*b30 q30 -- 32 bit… in ih264_iquant_itrans_recon_chroma_4x4_sse42() 401 temp5 = _mm_madd_epi16(src_r1, temp5); in ih264_iquant_itrans_recon_chroma_4x4_sse42() 402 temp6 = _mm_madd_epi16(src_r2, temp6); in ih264_iquant_itrans_recon_chroma_4x4_sse42() 403 temp7 = _mm_madd_epi16(src_r3, temp7); in ih264_iquant_itrans_recon_chroma_4x4_sse42()
|
D | ih264_chroma_intra_pred_filters_ssse3.c | 289 h_val_4x32b = _mm_madd_epi16(mul_8x16b, h_val1_8x16b); in ih264_intra_pred_chroma_8x8_mode_plane_ssse3() 290 v_val_4x32b = _mm_madd_epi16(mul_8x16b, v_val1_8x16b); in ih264_intra_pred_chroma_8x8_mode_plane_ssse3()
|
/external/neven/Embedded/common/src/b_BasicEm/ |
D | MathSSE2.c | 63 m_XMM0 = _mm_madd_epi16( m_XMM0, m_XMM1 ); in bbs_dotProduct_64SSE2() 68 m_XMM2 = _mm_madd_epi16( m_XMM2, m_XMM3 ); in bbs_dotProduct_64SSE2() 76 m_XMM4 = _mm_madd_epi16( m_XMM4, m_XMM5 ); in bbs_dotProduct_64SSE2() 79 m_XMM6 = _mm_madd_epi16( m_XMM6, m_XMM8 ); in bbs_dotProduct_64SSE2() 172 m_XMM0 = _mm_madd_epi16( m_XMM0, m_XMM2 ); in bbs_dotProduct_128SSE2() 178 m_XMM6 = _mm_madd_epi16( m_XMM6, m_XMM3 ); in bbs_dotProduct_128SSE2() 276 m_XMM0 = _mm_madd_epi16( m_XMM0, m_XMM2 ); in bbs_dotProduct_u128SSE2() 282 m_XMM6 = _mm_madd_epi16( m_XMM6, m_XMM3 ); in bbs_dotProduct_u128SSE2()
|
/external/webp/src/dsp/ |
D | enc_sse2.c | 394 const __m128i tmp0 = _mm_madd_epi16(a01, k88p); // [ (a0 + a1) << 3, ... ] in FTransform() 395 const __m128i tmp2 = _mm_madd_epi16(a01, k88m); // [ (a0 - a1) << 3, ... ] in FTransform() 396 const __m128i tmp1_1 = _mm_madd_epi16(a32, k5352_2217p); in FTransform() 397 const __m128i tmp3_1 = _mm_madd_epi16(a32, k5352_2217m); in FTransform() 434 const __m128i c1 = _mm_madd_epi16(b23, k5352_2217); in FTransform() 435 const __m128i c3 = _mm_madd_epi16(b23, k2217_5352); in FTransform() 532 const __m128i low_madd0 = _mm_madd_epi16(low0, low0); in SSE_Nx4() 533 const __m128i low_madd1 = _mm_madd_epi16(low1, low1); in SSE_Nx4() 534 const __m128i low_madd2 = _mm_madd_epi16(low2, low2); in SSE_Nx4() 535 const __m128i low_madd3 = _mm_madd_epi16(low3, low3); in SSE_Nx4() [all …]
|
/external/jpeg/ |
D | jidctintelsse.c | 132 …tmp1 = _mm_madd_epi16(tmp1, * ( __m128i*)table1); /*x2*w13+x0*w12, x2*w9+x0*w8, x2*w5+x0*w4, … in jpeg_idct_intelsse() 133 tmp5 = _mm_madd_epi16(tmp5, * ( __m128i*)table2); \ in jpeg_idct_intelsse() 140 …tmp3 = _mm_madd_epi16(tmp3, * ( __m128i*)(table1+16)); /*x3*w29+x1*w28, x3*w25+x1*w24, x3*w21+x1*w… in jpeg_idct_intelsse() 141 tmp7 = _mm_madd_epi16(tmp7, * ( __m128i*)(table2+16) ); \ in jpeg_idct_intelsse() 142 …row0 = _mm_madd_epi16(row0, * ( __m128i*)(table1+24)); /*x7*w31+x5*w30, x7*w27+x5*w26, x7*w23+x5*w… in jpeg_idct_intelsse() 143 row2 = _mm_madd_epi16(row2, * ( __m128i*)(table2+24) ); \ in jpeg_idct_intelsse() 144 …tmp2 = _mm_madd_epi16(tmp2, * ( __m128i*)(table1+8) ); /*x6*w15+x4*w14, x6*w11+x4*w10, x6*w7+x4*w6… in jpeg_idct_intelsse() 145 tmp6 = _mm_madd_epi16(tmp6, * ( __m128i*)(table2+8) ); \ in jpeg_idct_intelsse()
|