/external/libvpx/libvpx/vpx_dsp/x86/ |
D | convolve_ssse3.h | 47 const __m128i x0 = _mm_maddubs_epi16(s[0], f[0]); in convolve8_8_ssse3() 48 const __m128i x1 = _mm_maddubs_epi16(s[1], f[1]); in convolve8_8_ssse3() 49 const __m128i x2 = _mm_maddubs_epi16(s[2], f[2]); in convolve8_8_ssse3() 50 const __m128i x3 = _mm_maddubs_epi16(s[3], f[3]); in convolve8_8_ssse3() 70 const __m128i x0 = _mm_maddubs_epi16(s[0], f[0]); in convolve8_8_even_offset_ssse3() 71 const __m128i x1 = _mm_maddubs_epi16(s[1], f[1]); in convolve8_8_even_offset_ssse3() 72 const __m128i x2 = _mm_maddubs_epi16(s[2], f[2]); in convolve8_8_even_offset_ssse3() 73 const __m128i x3 = _mm_maddubs_epi16(s[3], f[3]); in convolve8_8_even_offset_ssse3() 75 const __m128i x4 = _mm_maddubs_epi16(s[1], _mm_set1_epi8(64)); in convolve8_8_even_offset_ssse3() 91 const __m128i x0 = _mm_maddubs_epi16(s[0], f[0]); in convolve8_8_odd_offset_ssse3() [all …]
|
D | vpx_subpixel_8t_intrin_ssse3.c | 88 srcRegFilt1 = _mm_maddubs_epi16(srcRegFilt1, firstFilters); in vpx_filter_block1d4_h8_intrin_ssse3() 89 srcRegFilt2 = _mm_maddubs_epi16(srcRegFilt2, secondFilters); in vpx_filter_block1d4_h8_intrin_ssse3() 249 tmp_0 = _mm_maddubs_epi16(src_reg_shift_0, kernel_reg_23); in vpx_filter_block1d16_h4_ssse3() 250 tmp_1 = _mm_maddubs_epi16(src_reg_shift_2, kernel_reg_45); in vpx_filter_block1d16_h4_ssse3() 260 tmp_0 = _mm_maddubs_epi16(src_reg_shift_0, kernel_reg_23); in vpx_filter_block1d16_h4_ssse3() 261 tmp_1 = _mm_maddubs_epi16(src_reg_shift_2, kernel_reg_45); in vpx_filter_block1d16_h4_ssse3() 347 res_reg_m10_lo = _mm_maddubs_epi16(src_reg_m10_lo, kernel_reg_23); in vpx_filter_block1d16_v4_ssse3() 348 res_reg_01_lo = _mm_maddubs_epi16(src_reg_01_lo, kernel_reg_23); in vpx_filter_block1d16_v4_ssse3() 350 res_reg_12_lo = _mm_maddubs_epi16(src_reg_12_lo, kernel_reg_45); in vpx_filter_block1d16_v4_ssse3() 351 res_reg_23_lo = _mm_maddubs_epi16(src_reg_23_lo, kernel_reg_45); in vpx_filter_block1d16_v4_ssse3() [all …]
|
D | convolve_avx2.h | 80 const __m128i x0 = _mm_maddubs_epi16(_mm256_castsi256_si128(s[0]), in convolve8_8_avx2() 82 const __m128i x1 = _mm_maddubs_epi16(_mm256_castsi256_si128(s[1]), in convolve8_8_avx2() 84 const __m128i x2 = _mm_maddubs_epi16(_mm256_castsi256_si128(s[2]), in convolve8_8_avx2() 86 const __m128i x3 = _mm_maddubs_epi16(_mm256_castsi256_si128(s[3]), in convolve8_8_avx2()
|
/external/libhevc/common/x86/ |
D | ihevc_inter_pred_filters_ssse3_intr.c | 336 … res_temp1_8x16b = _mm_maddubs_epi16(src_temp3_16x8b, coeff0_1_8x16b); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 342 … res_temp2_8x16b = _mm_maddubs_epi16(src_temp4_16x8b, coeff2_3_8x16b); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 348 … res_temp3_8x16b = _mm_maddubs_epi16(src_temp5_16x8b, coeff4_5_8x16b); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 354 … res_temp4_8x16b = _mm_maddubs_epi16(src_temp6_16x8b, coeff6_7_8x16b); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 369 … res_temp11_8x16b = _mm_maddubs_epi16(src_temp13_16x8b, coeff0_1_8x16b); /* row = 1 */ in ihevc_inter_pred_luma_horz_ssse3() 375 … res_temp12_8x16b = _mm_maddubs_epi16(src_temp14_16x8b, coeff2_3_8x16b); /* row = 1 */ in ihevc_inter_pred_luma_horz_ssse3() 381 … res_temp13_8x16b = _mm_maddubs_epi16(src_temp15_16x8b, coeff4_5_8x16b); /* row = 1 */ in ihevc_inter_pred_luma_horz_ssse3() 387 … res_temp14_8x16b = _mm_maddubs_epi16(src_temp16_16x8b, coeff6_7_8x16b); /* row = 1 */ in ihevc_inter_pred_luma_horz_ssse3() 425 … res_temp1_8x16b = _mm_maddubs_epi16(src_temp3_16x8b, coeff0_1_8x16b); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 431 … res_temp2_8x16b = _mm_maddubs_epi16(src_temp4_16x8b, coeff2_3_8x16b); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() [all …]
|
D | ihevc_intra_pred_filters_ssse3_intr.c | 754 res_temp_8x16b = _mm_maddubs_epi16(pu1_ref_16x8b, row_16x8b); in ihevc_intra_pred_luma_planar_ssse3() 755 res_temp1_8x16b = _mm_maddubs_epi16(pu1_ref_16x8b, row1_16x8b); in ihevc_intra_pred_luma_planar_ssse3() 756 res_temp2_8x16b = _mm_maddubs_epi16(pu1_ref_16x8b, row2_16x8b); in ihevc_intra_pred_luma_planar_ssse3() 757 res_temp3_8x16b = _mm_maddubs_epi16(pu1_ref_16x8b, row3_16x8b); in ihevc_intra_pred_luma_planar_ssse3() 759 res_temp4_8x16b = _mm_maddubs_epi16(res_temp4_8x16b, nt_row_16x8b); in ihevc_intra_pred_luma_planar_ssse3() 760 res_temp5_8x16b = _mm_maddubs_epi16(res_temp5_8x16b, nt_row1_16x8b); in ihevc_intra_pred_luma_planar_ssse3() 761 res_temp6_8x16b = _mm_maddubs_epi16(res_temp6_8x16b, nt_row2_16x8b); in ihevc_intra_pred_luma_planar_ssse3() 762 res_temp7_8x16b = _mm_maddubs_epi16(res_temp7_8x16b, nt_row3_16x8b); in ihevc_intra_pred_luma_planar_ssse3() 832 res_temp_8x16b = _mm_maddubs_epi16(pu1_ref_16x8b, row_16x8b); in ihevc_intra_pred_luma_planar_ssse3() 833 res_temp1_8x16b = _mm_maddubs_epi16(pu1_ref_16x8b, row1_16x8b); in ihevc_intra_pred_luma_planar_ssse3() [all …]
|
D | ihevc_intra_pred_filters_sse42_intr.c | 1515 src_temp1_8x16b = _mm_maddubs_epi16(src_temp1_8x16b, temp1_8x16b); in ihevc_intra_pred_luma_mode_3_to_9_sse42() 1516 src_temp2_8x16b = _mm_maddubs_epi16(src_temp2_8x16b, temp2_8x16b); in ihevc_intra_pred_luma_mode_3_to_9_sse42() 1517 src_temp3_8x16b = _mm_maddubs_epi16(src_temp3_8x16b, temp3_8x16b); in ihevc_intra_pred_luma_mode_3_to_9_sse42() 1518 src_temp4_8x16b = _mm_maddubs_epi16(src_temp4_8x16b, temp4_8x16b); in ihevc_intra_pred_luma_mode_3_to_9_sse42() 1654 src_temp1_8x16b = _mm_maddubs_epi16(src_temp1_8x16b, temp1_8x16b); in ihevc_intra_pred_luma_mode_3_to_9_sse42() 1655 src_temp2_8x16b = _mm_maddubs_epi16(src_temp2_8x16b, temp2_8x16b); in ihevc_intra_pred_luma_mode_3_to_9_sse42() 1656 src_temp3_8x16b = _mm_maddubs_epi16(src_temp3_8x16b, temp3_8x16b); in ihevc_intra_pred_luma_mode_3_to_9_sse42() 1657 src_temp4_8x16b = _mm_maddubs_epi16(src_temp4_8x16b, temp4_8x16b); in ihevc_intra_pred_luma_mode_3_to_9_sse42() 1660 src_temp11_8x16b = _mm_maddubs_epi16(src_temp11_8x16b, temp11_8x16b); in ihevc_intra_pred_luma_mode_3_to_9_sse42() 1661 src_temp12_8x16b = _mm_maddubs_epi16(src_temp12_8x16b, temp12_8x16b); in ihevc_intra_pred_luma_mode_3_to_9_sse42() [all …]
|
D | ihevc_chroma_intra_pred_filters_ssse3_intr.c | 1278 src_temp1_8x16b = _mm_maddubs_epi16(src_temp1_8x16b, temp1_8x16b); in ihevc_intra_pred_chroma_mode_3_to_9_ssse3() 1279 src_temp2_8x16b = _mm_maddubs_epi16(src_temp2_8x16b, temp2_8x16b); in ihevc_intra_pred_chroma_mode_3_to_9_ssse3() 1280 src_temp3_8x16b = _mm_maddubs_epi16(src_temp3_8x16b, temp3_8x16b); in ihevc_intra_pred_chroma_mode_3_to_9_ssse3() 1281 src_temp4_8x16b = _mm_maddubs_epi16(src_temp4_8x16b, temp4_8x16b); in ihevc_intra_pred_chroma_mode_3_to_9_ssse3() 1446 src_temp1_8x16b = _mm_maddubs_epi16(src_temp1_8x16b, temp1_8x16b); in ihevc_intra_pred_chroma_mode_3_to_9_ssse3() 1447 src_temp2_8x16b = _mm_maddubs_epi16(src_temp2_8x16b, temp2_8x16b); in ihevc_intra_pred_chroma_mode_3_to_9_ssse3() 1448 src_temp3_8x16b = _mm_maddubs_epi16(src_temp3_8x16b, temp3_8x16b); in ihevc_intra_pred_chroma_mode_3_to_9_ssse3() 1449 src_temp4_8x16b = _mm_maddubs_epi16(src_temp4_8x16b, temp4_8x16b); in ihevc_intra_pred_chroma_mode_3_to_9_ssse3() 1452 src_temp11_8x16b = _mm_maddubs_epi16(src_temp11_8x16b, temp11_8x16b); in ihevc_intra_pred_chroma_mode_3_to_9_ssse3() 1453 src_temp12_8x16b = _mm_maddubs_epi16(src_temp12_8x16b, temp12_8x16b); in ihevc_intra_pred_chroma_mode_3_to_9_ssse3() [all …]
|
D | ihevc_deblk_ssse3_intr.c | 153 mask_d_result_4x32b = _mm_maddubs_epi16(src_tmp_8x16b, coef_8x16b); in ihevc_deblk_luma_vert_ssse3() 166 mask_de_result_8x16b = _mm_maddubs_epi16(mask_de_result_8x16b, temp_coef0_8x16b); in ihevc_deblk_luma_vert_ssse3() 274 temp_pq_str0_16x8b = _mm_maddubs_epi16(temp_pq_str0_16x8b, const2_8x16b); in ihevc_deblk_luma_vert_ssse3() 290 temp_pq1_str0_16x8b = _mm_maddubs_epi16(temp_pq1_str0_16x8b, const2_8x16b); in ihevc_deblk_luma_vert_ssse3() 291 temp_pq1_str1_16x8b = _mm_maddubs_epi16(temp_pq1_str1_16x8b, const2_8x16b); in ihevc_deblk_luma_vert_ssse3() 319 temp_pq2_str0_16x8b = _mm_maddubs_epi16(temp_str3_16x8b, const2_8x16b); in ihevc_deblk_luma_vert_ssse3() 411 tmp_delta3_8x16b = _mm_maddubs_epi16(tmp_delta2_8x16b, coefdelta_0_8x16b); in ihevc_deblk_luma_vert_ssse3() 433 tmp_delta3_8x16b = _mm_maddubs_epi16(tmp_delta2_8x16b, coefdelta_0_8x16b); in ihevc_deblk_luma_vert_ssse3() 613 mask_d_result_4x32b = _mm_maddubs_epi16(src_tmp_p_0_8x16b, coef_8x16b); in ihevc_deblk_luma_horz_ssse3() 626 mask_de_result_8x16b = _mm_maddubs_epi16(mask_de_result_8x16b, temp_coef0_8x16b); in ihevc_deblk_luma_horz_ssse3() [all …]
|
/external/libavc/common/x86/ |
D | ih264_inter_pred_filters_ssse3.c | 262 …res_r0r1_t1_8x16b = _mm_maddubs_epi16(src_r0r1_16x8b, coeff0_1_16x8b); //a0*c0+a1*c1 a1*c0+a2*c1 … in ih264_inter_pred_luma_horz_ssse3() 269 …res_r0r1_t2_8x16b = _mm_maddubs_epi16(src_r0r1_16x8b, coeff2_3_16x8b); //a2*c2+a3*c3 a3*c2+a4*c3 … in ih264_inter_pred_luma_horz_ssse3() 276 …res_r0r1_t3_8x16b = _mm_maddubs_epi16(src_r0r1_16x8b, coeff4_5_16x8b); //a4*c4+a5*c5 a5*c4+a6*c5 … in ih264_inter_pred_luma_horz_ssse3() 326 …res_r0_t1_8x16b = _mm_maddubs_epi16(src_r0_t1_16x8b, coeff0_1_16x8b); //a0*c0+a1*c1 a1*c0+a2*c1 a2… in ih264_inter_pred_luma_horz_ssse3() 328 …res_r1_t1_8x16b = _mm_maddubs_epi16(src_r1_t1_16x8b, coeff0_1_16x8b); //b0*c0+b1*c1 b1*c0+b2*c1 b2… in ih264_inter_pred_luma_horz_ssse3() 340 …res_r0_t2_8x16b = _mm_maddubs_epi16(src_r0_t1_16x8b, coeff2_3_16x8b); //a2*c2+a3*c3 a3*c2+a4*c3 a4… in ih264_inter_pred_luma_horz_ssse3() 342 …res_r1_t2_8x16b = _mm_maddubs_epi16(src_r1_t1_16x8b, coeff2_3_16x8b); //b2*c2+b3*c3 b3*c2+b4*c3 b2… in ih264_inter_pred_luma_horz_ssse3() 354 …res_r0_t3_8x16b = _mm_maddubs_epi16(src_r0_t1_16x8b, coeff4_5_16x8b); //a4*c4+a5*c5 a5*c4+a6*c5 a6… in ih264_inter_pred_luma_horz_ssse3() 356 …res_r1_t3_8x16b = _mm_maddubs_epi16(src_r1_t1_16x8b, coeff4_5_16x8b); //b4*c4+b5*c5 b5*c4+b6*c5 b6… in ih264_inter_pred_luma_horz_ssse3() 403 …res_r0_t1_8x16b = _mm_maddubs_epi16(src_r0_t1_16x8b, coeff0_1_16x8b); //a0*c0+a1*c1 a1*c0+a2*c1 a2… in ih264_inter_pred_luma_horz_ssse3() [all …]
|
/external/libaom/libaom/aom_dsp/x86/ |
D | aom_subpixel_8t_intrin_ssse3.c | 93 srcRegFilt32b1_1 = _mm_maddubs_epi16(srcRegFilt32b1_1, firstFilters); in aom_filter_block1d4_h4_ssse3() 164 resReglo = _mm_maddubs_epi16(srcReg2345_3456_lo, firstFilters); in aom_filter_block1d4_v4_ssse3() 165 resReghi = _mm_maddubs_epi16(srcReg2345_3456_hi, firstFilters); in aom_filter_block1d4_v4_ssse3() 233 srcRegFilt1 = _mm_maddubs_epi16(srcRegFilt1, firstFilters); in aom_filter_block1d4_h8_intrin_ssse3() 234 srcRegFilt2 = _mm_maddubs_epi16(srcRegFilt2, secondFilters); in aom_filter_block1d4_h8_intrin_ssse3() 298 srcRegFilt32b3 = _mm_maddubs_epi16(srcRegFilt32b3, secondFilters); in aom_filter_block1d8_h4_ssse3() 299 srcRegFilt32b2 = _mm_maddubs_epi16(srcRegFilt32b2, thirdFilters); in aom_filter_block1d8_h4_ssse3() 367 resReg23 = _mm_maddubs_epi16(srcReg23, secondFilters); in aom_filter_block1d8_v4_ssse3() 368 resReg34 = _mm_maddubs_epi16(srcReg34, secondFilters); in aom_filter_block1d8_v4_ssse3() 369 resReg45 = _mm_maddubs_epi16(srcReg45, thirdFilters); in aom_filter_block1d8_v4_ssse3() [all …]
|
D | aom_subpixel_8t_intrin_avx2.c | 141 _mm_maddubs_epi16(srcRegFilt1_1, _mm256_castsi256_si128(firstFilters)); in aom_filter_block1d4_h4_avx2() 238 _mm_maddubs_epi16(srcRegFilt1_1, _mm256_castsi256_si128(firstFilters)); in aom_filter_block1d4_h8_avx2() 245 _mm_maddubs_epi16(srcRegFilt2, _mm256_castsi256_si128(secondFilters)); in aom_filter_block1d4_h8_avx2() 337 _mm_maddubs_epi16(srcRegFilt2, _mm256_castsi256_si128(secondFilters)); in aom_filter_block1d8_h4_avx2() 339 _mm_maddubs_epi16(srcRegFilt3, _mm256_castsi256_si128(thirdFilters)); in aom_filter_block1d8_h4_avx2() 453 _mm_maddubs_epi16(srcRegFilt1_1, _mm256_castsi256_si128(firstFilters)); in aom_filter_block1d8_h8_avx2() 455 _mm_maddubs_epi16(srcRegFilt2, _mm256_castsi256_si128(forthFilters)); in aom_filter_block1d8_h8_avx2() 466 _mm_maddubs_epi16(srcRegFilt3, _mm256_castsi256_si128(secondFilters)); in aom_filter_block1d8_h8_avx2() 468 _mm_maddubs_epi16(srcRegFilt2, _mm256_castsi256_si128(thirdFilters)); in aom_filter_block1d8_h8_avx2() 729 _mm_maddubs_epi16(srcRegFilt1_1, _mm256_castsi256_si128(firstFilters)); in aom_filter_block1d16_h8_avx2() [all …]
|
D | masked_variance_intrin_ssse3.h | 42 const __m128i blendAL = _mm_maddubs_epi16(ssAL, aaAL); in comp_mask_pred_16_ssse3() 43 const __m128i blendAH = _mm_maddubs_epi16(ssAH, aaAH); in comp_mask_pred_16_ssse3() 77 const __m128i blendA = _mm_maddubs_epi16(ssA, aaA); in comp_mask_pred_8_ssse3() 78 const __m128i blendB = _mm_maddubs_epi16(ssB, aaB); in comp_mask_pred_8_ssse3()
|
D | blend_sse4.h | 64 const __m128i v_p0_w = _mm_maddubs_epi16(_mm_unpacklo_epi8(v_s0_b, v_s1_b), in blend_4_u8() 78 const __m128i v_p0_w = _mm_maddubs_epi16(_mm_unpacklo_epi8(v_s0_b, v_s1_b), in blend_8_u8() 92 const __m128i v_p0_w = _mm_maddubs_epi16(_mm_unpacklo_epi8(v_s0_b, v_s1_b), in blend_16_u8() 94 const __m128i v_p1_w = _mm_maddubs_epi16(_mm_unpackhi_epi8(v_s0_b, v_s1_b), in blend_16_u8()
|
D | blend_mask_sse4.h | 113 const __m128i m_acbd = _mm_maddubs_epi16(m_ac, one_b); in aom_lowbd_blend_a64_d16_mask_subw1_subh1_w4_sse4_1() 138 const __m128i m_acbd = _mm_maddubs_epi16(m_ac, one_b); in aom_lowbd_blend_a64_d16_mask_subw1_subh1_w8_sse4_1() 161 const __m128i m_ac = _mm_maddubs_epi16(m_i0, one_b); in aom_lowbd_blend_a64_d16_mask_subw1_subh0_w4_sse4_1() 183 const __m128i m_ac = _mm_maddubs_epi16(m_i0, one_b); in aom_lowbd_blend_a64_d16_mask_subw1_subh0_w8_sse4_1()
|
D | masked_sad_intrin_ssse3.c | 117 __m128i pred_l = _mm_maddubs_epi16(data_l, mask_l); in masked_sad_ssse3() 122 __m128i pred_r = _mm_maddubs_epi16(data_r, mask_r); in masked_sad_ssse3() 164 __m128i pred_l = _mm_maddubs_epi16(data_l, mask_l); in aom_masked_sad8xh_ssse3() 169 __m128i pred_r = _mm_maddubs_epi16(data_r, mask_r); in aom_masked_sad8xh_ssse3() 213 __m128i pred_16bit = _mm_maddubs_epi16(data, mask); in aom_masked_sad4xh_ssse3()
|
D | variance_impl_ssse3.c | 48 __m128i res = _mm_maddubs_epi16(source, filters); in aom_var_filter_block2d_bil_first_pass_ssse3() 74 __m128i res = _mm_maddubs_epi16(source_shuffle, filters); in aom_var_filter_block2d_bil_first_pass_ssse3()
|
D | jnt_variance_ssse3.c | 36 __m128i mult_lo = _mm_maddubs_epi16(p_lo, *w); in compute_dist_wtd_avg() 41 __m128i mult_hi = _mm_maddubs_epi16(p_hi, *w); in compute_dist_wtd_avg()
|
D | masked_variance_intrin_ssse3.c | 139 v0 = _mm_maddubs_epi16(v0, filter); in filter_block() 143 v1 = _mm_maddubs_epi16(v1, filter); in filter_block() 225 v0 = _mm_maddubs_epi16(v0, *filter); in filter_block_2rows() 229 v1 = _mm_maddubs_epi16(v1, *filter); in filter_block_2rows() 276 v0 = _mm_maddubs_epi16(v0, hfilter_vec); in bilinear_filter8xh() 357 v0 = _mm_maddubs_epi16(v0, hfilter_vec); in bilinear_filter4xh() 408 __m128i pred_l = _mm_maddubs_epi16(data_l, mask_l); in accumulate_block() 413 __m128i pred_r = _mm_maddubs_epi16(data_r, mask_r); in accumulate_block()
|
D | blend_a64_mask_sse4.c | 942 const __m128i m0_acbd = _mm_maddubs_epi16(m0_ac, one_b); in lowbd_blend_a64_d16_mask_subw1_subh1_w16_sse4_1() 943 const __m128i m1_acbd = _mm_maddubs_epi16(m1_ac, one_b); in lowbd_blend_a64_d16_mask_subw1_subh1_w16_sse4_1() 969 const __m128i m0_ac = _mm_maddubs_epi16(m_i00, one_b); in lowbd_blend_a64_d16_mask_subw1_subh0_w16_sse4_1() 970 const __m128i m1_ac = _mm_maddubs_epi16(m_i01, one_b); in lowbd_blend_a64_d16_mask_subw1_subh0_w16_sse4_1() 1224 const __m128i m0123 = _mm_maddubs_epi16(_mm_adds_epu8(m02, m13), one_b); in highbd_blend_a64_d16_mask_subw1_subh1_w4_sse4_1() 1230 const __m128i m4567 = _mm_maddubs_epi16(_mm_adds_epu8(m46, m57), one_b); in highbd_blend_a64_d16_mask_subw1_subh1_w4_sse4_1() 1342 const __m128i mask_16a = _mm_maddubs_epi16(mask_bothrowsa, one_b); in highbd_blend_a64_d16_mask_subw1_subh1_w8_sse4_1() 1343 const __m128i mask_16b = _mm_maddubs_epi16(mask_bothrowsb, one_b); in highbd_blend_a64_d16_mask_subw1_subh1_w8_sse4_1() 1464 const __m128i m0_acbd = _mm_maddubs_epi16(m0_ac, one_b); in highbd_blend_a64_d16_mask_subw1_subh1_w16_sse4_1() 1465 const __m128i m1_acbd = _mm_maddubs_epi16(m1_ac, one_b); in highbd_blend_a64_d16_mask_subw1_subh1_w16_sse4_1()
|
/external/libavc/encoder/x86/ |
D | ih264e_half_pel_ssse3.c | 141 …res_r0_t1_8x16b = _mm_maddubs_epi16(src_r0_t1_16x8b, coeff0_1_16x8b); //a0*c0+a1*c1 a1*c0+a2*c1… in ih264e_sixtapfilter_horz_ssse3() 143 …res_r1_t1_8x16b = _mm_maddubs_epi16(src_r1_t1_16x8b, coeff0_1_16x8b); //b0*c0+b1*c1 b1*c0+b2*c1… in ih264e_sixtapfilter_horz_ssse3() 155 …res_r0_t2_8x16b = _mm_maddubs_epi16(src_r0_t1_16x8b, coeff2_3_16x8b); //a2*c2+a3*c3 a3*c2+a4*c3… in ih264e_sixtapfilter_horz_ssse3() 157 …res_r1_t2_8x16b = _mm_maddubs_epi16(src_r1_t1_16x8b, coeff2_3_16x8b); //b2*c2+b3*c3 b3*c2+b4*c3… in ih264e_sixtapfilter_horz_ssse3() 169 …res_r0_t3_8x16b = _mm_maddubs_epi16(src_r0_t1_16x8b, coeff4_5_16x8b); //a4*c4+a5*c5 a5*c4+a6*c5… in ih264e_sixtapfilter_horz_ssse3() 171 …res_r1_t3_8x16b = _mm_maddubs_epi16(src_r1_t1_16x8b, coeff4_5_16x8b); //b4*c4+b5*c5 b5*c4+b6*c5… in ih264e_sixtapfilter_horz_ssse3() 312 res_t1_8x16b = _mm_maddubs_epi16(src_r0r1_16x8b, coeff0_1_16x8b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 313 res_t2_8x16b = _mm_maddubs_epi16(src_r2r3_16x8b, coeff2_3_16x8b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 314 res_t3_8x16b = _mm_maddubs_epi16(src_r4r5_16x8b, coeff4_5_16x8b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 325 res_t1_8x16b = _mm_maddubs_epi16(src_r0r1_16x8b, coeff0_1_16x8b); in ih264e_sixtap_filter_2dvh_vert_ssse3() [all …]
|
/external/libaom/libaom/av1/common/x86/ |
D | cfl_ssse3.c | 51 top = _mm_maddubs_epi16(top, twos); in cfl_luma_subsampling_420_lbd_ssse3() 53 bot = _mm_maddubs_epi16(bot, twos); in cfl_luma_subsampling_420_lbd_ssse3() 58 top = _mm_maddubs_epi16(top, twos); in cfl_luma_subsampling_420_lbd_ssse3() 60 bot = _mm_maddubs_epi16(bot, twos); in cfl_luma_subsampling_420_lbd_ssse3() 65 top = _mm_maddubs_epi16(top, twos); in cfl_luma_subsampling_420_lbd_ssse3() 67 bot = _mm_maddubs_epi16(bot, twos); in cfl_luma_subsampling_420_lbd_ssse3() 74 top_1 = _mm_maddubs_epi16(top_1, twos); in cfl_luma_subsampling_420_lbd_ssse3() 75 bot_1 = _mm_maddubs_epi16(bot_1, twos); in cfl_luma_subsampling_420_lbd_ssse3() 105 top = _mm_maddubs_epi16(top, fours); in cfl_luma_subsampling_422_lbd_ssse3() 109 top = _mm_maddubs_epi16(top, fours); in cfl_luma_subsampling_422_lbd_ssse3() [all …]
|
D | intra_edge_sse4.c | 58 d0 = _mm_maddubs_epi16(d0, coef0); in av1_filter_intra_edge_sse4_1() 59 d1 = _mm_maddubs_epi16(d1, coef0); in av1_filter_intra_edge_sse4_1() 91 d0 = _mm_maddubs_epi16(d0, coef0); in av1_filter_intra_edge_sse4_1() 92 d1 = _mm_maddubs_epi16(d1, coef0); in av1_filter_intra_edge_sse4_1() 93 d2 = _mm_maddubs_epi16(d2, coef0); in av1_filter_intra_edge_sse4_1() 94 d3 = _mm_maddubs_epi16(d3, coef0); in av1_filter_intra_edge_sse4_1() 243 d0 = _mm_maddubs_epi16(d0, coef0); in av1_upsample_intra_edge_sse4_1() 244 d1 = _mm_maddubs_epi16(d1, coef0); in av1_upsample_intra_edge_sse4_1() 245 d2 = _mm_maddubs_epi16(d2, coef0); in av1_upsample_intra_edge_sse4_1() 246 d3 = _mm_maddubs_epi16(d3, coef0); in av1_upsample_intra_edge_sse4_1()
|
D | filterintra_sse4.c | 53 const __m128i out_01 = _mm_maddubs_epi16(in, f1f0); in av1_filter_intra_predictor_sse4_1() 54 const __m128i out_23 = _mm_maddubs_epi16(in, f3f2); in av1_filter_intra_predictor_sse4_1() 55 const __m128i out_45 = _mm_maddubs_epi16(in, f5f4); in av1_filter_intra_predictor_sse4_1() 56 const __m128i out_67 = _mm_maddubs_epi16(in, f7f6); in av1_filter_intra_predictor_sse4_1()
|
D | warp_plane_sse4.c | 238 const __m128i res_02 = _mm_maddubs_epi16(src_02, coeff[0]); in filter_src_pixels() 242 const __m128i res_46 = _mm_maddubs_epi16(src_46, coeff[1]); in filter_src_pixels() 246 const __m128i res_13 = _mm_maddubs_epi16(src_13, coeff[2]); in filter_src_pixels() 250 const __m128i res_57 = _mm_maddubs_epi16(src_57, coeff[3]); in filter_src_pixels()
|
/external/clang/test/CodeGen/ |
D | ssse3-builtins.c | 79 return _mm_maddubs_epi16(a, b); in test_mm_maddubs_epi16()
|