/external/libhevc/common/x86/ |
D | ihevc_weighted_pred_sse42_intr.c | 182 src_temp0_4x32b = _mm_mullo_epi32(src_temp0_4x32b, wgt0_4x32b); in ihevc_weighted_pred_uni_sse42() 183 src_temp1_4x32b = _mm_mullo_epi32(src_temp1_4x32b, wgt0_4x32b); in ihevc_weighted_pred_uni_sse42() 184 src_temp2_4x32b = _mm_mullo_epi32(src_temp2_4x32b, wgt0_4x32b); in ihevc_weighted_pred_uni_sse42() 185 src_temp3_4x32b = _mm_mullo_epi32(src_temp3_4x32b, wgt0_4x32b); in ihevc_weighted_pred_uni_sse42() 200 src_temp4_4x32b = _mm_mullo_epi32(src_temp4_4x32b, wgt0_4x32b); in ihevc_weighted_pred_uni_sse42() 201 src_temp5_4x32b = _mm_mullo_epi32(src_temp5_4x32b, wgt0_4x32b); in ihevc_weighted_pred_uni_sse42() 202 src_temp6_4x32b = _mm_mullo_epi32(src_temp6_4x32b, wgt0_4x32b); in ihevc_weighted_pred_uni_sse42() 203 src_temp7_4x32b = _mm_mullo_epi32(src_temp7_4x32b, wgt0_4x32b); in ihevc_weighted_pred_uni_sse42() 298 src_temp0_4x32b = _mm_mullo_epi32(src_temp0_4x32b, wgt0_4x32b); in ihevc_weighted_pred_uni_sse42() 299 src_temp1_4x32b = _mm_mullo_epi32(src_temp1_4x32b, wgt0_4x32b); in ihevc_weighted_pred_uni_sse42() [all …]
|
D | ihevc_itrans_recon_sse42_intr.c | 177 m_temp_reg_13 = _mm_mullo_epi32(m_temp_reg_1, m_coeff3); in ihevc_itrans_recon_4x4_ttype1_sse42() 206 m_temp_reg_30 = _mm_mullo_epi32(m_temp_reg_10, m_coeff1); //29*c0 in ihevc_itrans_recon_4x4_ttype1_sse42() 207 m_temp_reg_31 = _mm_mullo_epi32(m_temp_reg_11, m_coeff2); //55*c1 in ihevc_itrans_recon_4x4_ttype1_sse42() 211 m_temp_reg_32 = _mm_mullo_epi32(m_temp_reg_11, m_coeff1); //29*c1 in ihevc_itrans_recon_4x4_ttype1_sse42() 212 m_temp_reg_33 = _mm_mullo_epi32(m_temp_reg_12, m_coeff2); //55*c2 in ihevc_itrans_recon_4x4_ttype1_sse42() 216 m_temp_reg_34 = _mm_mullo_epi32(m_temp_reg_10, m_coeff2); //55*c0 in ihevc_itrans_recon_4x4_ttype1_sse42() 217 m_temp_reg_35 = _mm_mullo_epi32(m_temp_reg_12, m_coeff1); //29*c2 in ihevc_itrans_recon_4x4_ttype1_sse42() 218 m_temp_reg_36 = _mm_mullo_epi32(m_temp_reg_14, m_coeff3); //74*c4 in ihevc_itrans_recon_4x4_ttype1_sse42() 272 m_temp_reg_3 = _mm_mullo_epi32(m_temp_reg_22, m_coeff3); in ihevc_itrans_recon_4x4_ttype1_sse42() 297 m_temp_reg_30 = _mm_mullo_epi32(m_temp_reg_0, m_coeff1); //29*c0 in ihevc_itrans_recon_4x4_ttype1_sse42() [all …]
|
/external/flac/libFLAC/ |
D | lpc_intrin_sse41.c | 987 summ = _mm_mullo_epi32(q11, _mm_loadu_si128((const __m128i*)(data+i-12))); in FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse41() 988 …mull = _mm_mullo_epi32(q10, _mm_loadu_si128((const __m128i*)(data+i-11))); summ = _mm_add_epi32(su… in FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse41() 989 …mull = _mm_mullo_epi32(q9, _mm_loadu_si128((const __m128i*)(data+i-10))); summ = _mm_add_epi32(sum… in FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse41() 990 …mull = _mm_mullo_epi32(q8, _mm_loadu_si128((const __m128i*)(data+i-9))); summ = _mm_add_epi32(summ… in FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse41() 991 …mull = _mm_mullo_epi32(q7, _mm_loadu_si128((const __m128i*)(data+i-8))); summ = _mm_add_epi32(summ… in FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse41() 992 …mull = _mm_mullo_epi32(q6, _mm_loadu_si128((const __m128i*)(data+i-7))); summ = _mm_add_epi32(summ… in FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse41() 993 …mull = _mm_mullo_epi32(q5, _mm_loadu_si128((const __m128i*)(data+i-6))); summ = _mm_add_epi32(summ… in FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse41() 994 …mull = _mm_mullo_epi32(q4, _mm_loadu_si128((const __m128i*)(data+i-5))); summ = _mm_add_epi32(summ… in FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse41() 995 …mull = _mm_mullo_epi32(q3, _mm_loadu_si128((const __m128i*)(data+i-4))); summ = _mm_add_epi32(summ… in FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse41() 996 …mull = _mm_mullo_epi32(q2, _mm_loadu_si128((const __m128i*)(data+i-3))); summ = _mm_add_epi32(summ… in FLAC__lpc_compute_residual_from_qlp_coefficients_intrin_sse41() [all …]
|
/external/libaom/libaom/av1/common/x86/ |
D | highbd_inv_txfm_sse4.c | 404 x = _mm_mullo_epi32(u0, cospi32); in idct4x4_sse4_1() 405 y = _mm_mullo_epi32(u2, cospi32); in idct4x4_sse4_1() 414 x = _mm_mullo_epi32(u1, cospi48); in idct4x4_sse4_1() 415 y = _mm_mullo_epi32(u3, cospim16); in idct4x4_sse4_1() 420 x = _mm_mullo_epi32(u1, cospi16); in idct4x4_sse4_1() 421 y = _mm_mullo_epi32(u3, cospi48); in idct4x4_sse4_1() 463 s0 = _mm_mullo_epi32(x0, sinpi1); in iadst4x4_sse4_1() 464 s1 = _mm_mullo_epi32(x0, sinpi2); in iadst4x4_sse4_1() 465 s2 = _mm_mullo_epi32(x1, sinpi3); in iadst4x4_sse4_1() 466 s3 = _mm_mullo_epi32(x2, sinpi4); in iadst4x4_sse4_1() [all …]
|
D | selfguided_sse4.c | 159 an = _mm_max_epi32(_mm_mullo_epi32(a, _mm_set1_epi32(n)), bb); in compute_p() 162 an = _mm_mullo_epi32(sum2, _mm_set1_epi32(n)); in compute_p() 213 _mm_srli_epi32(_mm_add_epi32(_mm_mullo_epi32(p, s), rnd_z), in calc_ab() 233 const __m128i b_int = _mm_mullo_epi32(a_comp_over_n, sum1); in calc_ab() 353 _mm_srli_epi32(_mm_add_epi32(_mm_mullo_epi32(p, s), rnd_z), in calc_ab_fast() 373 const __m128i b_int = _mm_mullo_epi32(a_comp_over_n, sum1); in calc_ab_fast() 625 v_0 = _mm_add_epi32(v_0, _mm_mullo_epi32(xq0, f1_0)); in apply_selfguided_restoration_sse4_1() 628 v_1 = _mm_add_epi32(v_1, _mm_mullo_epi32(xq0, f1_1)); in apply_selfguided_restoration_sse4_1() 633 v_0 = _mm_add_epi32(v_0, _mm_mullo_epi32(xq1, f2_0)); in apply_selfguided_restoration_sse4_1() 636 v_1 = _mm_add_epi32(v_1, _mm_mullo_epi32(xq1, f2_1)); in apply_selfguided_restoration_sse4_1()
|
D | av1_txfm_sse4.h | 55 const __m128i r1 = _mm_mullo_epi32(sqrt2, r0); in av1_round_shift_rect_array_32_sse4_1() 62 const __m128i r1 = _mm_mullo_epi32(sqrt2, r0); in av1_round_shift_rect_array_32_sse4_1()
|
D | highbd_txfm_utility_sse4.h | 103 x = _mm_mullo_epi32(*w0, *n0); in half_btf_sse4_1() 104 y = _mm_mullo_epi32(*w1, *n1); in half_btf_sse4_1() 115 x = _mm_mullo_epi32(*w0, *n0); in half_btf_0_sse4_1()
|
D | highbd_warp_plane_sse4.c | 541 res_lo = _mm_add_epi32(_mm_mullo_epi32(p_32, wt0), in av1_highbd_warp_affine_sse4_1() 542 _mm_mullo_epi32(res_lo, wt1)); in av1_highbd_warp_affine_sse4_1() 574 res_hi = _mm_add_epi32(_mm_mullo_epi32(p4_32, wt0), in av1_highbd_warp_affine_sse4_1() 575 _mm_mullo_epi32(res_hi, wt1)); in av1_highbd_warp_affine_sse4_1()
|
D | av1_convolve_scale_sse4.c | 412 shifted = _mm_add_epi32(_mm_mullo_epi32(p_32, wt0), in highbd_vfilter8() 413 _mm_mullo_epi32(shifted, wt1)); in highbd_vfilter8()
|
/external/libaom/libaom/av1/encoder/x86/ |
D | highbd_fwd_txfm_sse4.c | 81 u0 = _mm_mullo_epi32(s0, cospi32); in fdct4x4_sse4_1() 82 u1 = _mm_mullo_epi32(s1, cospi32); in fdct4x4_sse4_1() 93 v0 = _mm_mullo_epi32(s2, cospi48); in fdct4x4_sse4_1() 94 v1 = _mm_mullo_epi32(s3, cospi16); in fdct4x4_sse4_1() 100 v0 = _mm_mullo_epi32(s2, cospi16); in fdct4x4_sse4_1() 101 v1 = _mm_mullo_epi32(s3, cospi48); in fdct4x4_sse4_1() 143 s0 = _mm_mullo_epi32(in[idx], sinpi1); in fadst4x4_sse4_1() 144 s1 = _mm_mullo_epi32(in[idx], sinpi4); in fadst4x4_sse4_1() 147 s2 = _mm_mullo_epi32(in[idx], sinpi2); in fadst4x4_sse4_1() 148 s3 = _mm_mullo_epi32(in[idx], sinpi1); in fadst4x4_sse4_1() [all …]
|
D | av1_txfm1d_sse4.h | 100 const __m128i in0_w0 = _mm_mullo_epi32(in0, ww0); \ 101 const __m128i in1_w1 = _mm_mullo_epi32(in1, ww1); \ 104 const __m128i in0_w1 = _mm_mullo_epi32(in0, ww1); \ 105 const __m128i in1_w0 = _mm_mullo_epi32(in1, ww0); \ 121 const __m128i in0_w0 = _mm_mullo_epi32(in0, ww0); \ 122 const __m128i in1_w1 = _mm_mullo_epi32(in1, ww1); \ 126 const __m128i in0_w1 = _mm_mullo_epi32(in0, ww1); \ 127 const __m128i in1_w0 = _mm_mullo_epi32(in1, ww0); \
|
D | pickrst_sse4.c | 677 const __m128i v0l = _mm_mullo_epi32(flt0l_subu, xq0); in av1_highbd_pixel_proj_error_sse4_1() 678 const __m128i v0h = _mm_mullo_epi32(flt0h_subu, xq0); in av1_highbd_pixel_proj_error_sse4_1() 679 const __m128i v1l = _mm_mullo_epi32(flt1l_subu, xq1); in av1_highbd_pixel_proj_error_sse4_1() 680 const __m128i v1h = _mm_mullo_epi32(flt1h_subu, xq1); in av1_highbd_pixel_proj_error_sse4_1() 744 const __m128i flth_xq = _mm_mullo_epi32(flth, xq_active); in av1_highbd_pixel_proj_error_sse4_1() 745 const __m128i fltl_xq = _mm_mullo_epi32(fltl, xq_active); in av1_highbd_pixel_proj_error_sse4_1() 746 const __m128i d0h_xq = _mm_mullo_epi32(d0h, xq_inactive); in av1_highbd_pixel_proj_error_sse4_1() 747 const __m128i d0l_xq = _mm_mullo_epi32(d0l, xq_inactive); in av1_highbd_pixel_proj_error_sse4_1()
|
D | highbd_temporal_filter_sse4.c | 37 dist_first = _mm_mullo_epi32(dist_first, dist_first); in highbd_store_dist_8() 38 dist_second = _mm_mullo_epi32(dist_second, dist_second); in highbd_store_dist_8() 109 *output = _mm_mullo_epi32(*output, weight_u32); in highbd_average_4()
|
/external/libaom/libaom/aom_dsp/x86/ |
D | convolve_sse4_1.h | 26 d = _mm_add_epi32(_mm_mullo_epi32(d, *wt0), _mm_mullo_epi32(*res, *wt1)); in mult_add_store() 41 const __m128i wt0_res = _mm_mullo_epi32(*data_ref_0, *wt0); in highbd_comp_avg_sse4_1() 42 const __m128i wt1_res = _mm_mullo_epi32(*res_unsigned, *wt1); in highbd_comp_avg_sse4_1()
|
D | obmc_intrinsic_sse4.h | 44 const __m128i v_sqrdiff_d = _mm_mullo_epi32(v_rdiff_d, v_rdiff_d); in obmc_variance_w4()
|
D | obmc_variance_sse4.c | 195 const __m128i v_sqrdiff_d = _mm_mullo_epi32(v_rdiff_d, v_rdiff_d); in hbd_obmc_variance_w4()
|
/external/libavc/common/x86/ |
D | ih264_ihadamard_scaling_sse42.c | 173 src_r0 = _mm_mullo_epi32(src_r0, mult_val); in ih264_ihadamard_scaling_4x4_sse42() 174 src_r1 = _mm_mullo_epi32(src_r1, mult_val); in ih264_ihadamard_scaling_4x4_sse42() 175 src_r2 = _mm_mullo_epi32(src_r2, mult_val); in ih264_ihadamard_scaling_4x4_sse42() 176 src_r3 = _mm_mullo_epi32(src_r3, mult_val); in ih264_ihadamard_scaling_4x4_sse42() 234 …temp0 = _mm_mullo_epi32(scale_val, plane_0); //multiply by pu2_iscal_mat[0] * pu2_weigh_mat… in ih264_ihadamard_scaling_2x2_uv_sse42() 235 …temp1 = _mm_mullo_epi32(scale_val, plane_1); //multiply by pu2_iscal_mat[0] * pu2_weigh_mat… in ih264_ihadamard_scaling_2x2_uv_sse42()
|
D | ih264_resi_trans_quant_sse42.c | 265 temp0 = _mm_mullo_epi32(temp0, src_r0); in ih264_resi_trans_quant_4x4_sse42() 266 temp1 = _mm_mullo_epi32(temp1, src_r1); in ih264_resi_trans_quant_4x4_sse42() 267 temp2 = _mm_mullo_epi32(temp2, src_r2); in ih264_resi_trans_quant_4x4_sse42() 268 temp3 = _mm_mullo_epi32(temp3, src_r3); in ih264_resi_trans_quant_4x4_sse42() 548 temp0 = _mm_mullo_epi32(temp0, src_r0); in ih264_resi_trans_quant_chroma_4x4_sse42() 549 temp1 = _mm_mullo_epi32(temp1, src_r1); in ih264_resi_trans_quant_chroma_4x4_sse42() 550 temp2 = _mm_mullo_epi32(temp2, src_r2); in ih264_resi_trans_quant_chroma_4x4_sse42() 551 temp3 = _mm_mullo_epi32(temp3, src_r3); in ih264_resi_trans_quant_chroma_4x4_sse42() 779 temp0 = _mm_mullo_epi32(scale_val, src_r0); //multiply by pu2_scale_matrix[0] in ih264_hadamard_quant_4x4_sse42() 780 temp1 = _mm_mullo_epi32(scale_val, src_r1); in ih264_hadamard_quant_4x4_sse42() [all …]
|
/external/libopus/celt/x86/ |
D | pitch_sse4_1.c | 92 inVec1_3210 = _mm_mullo_epi32(inVec1_3210, inVec2_3210); in celt_inner_prod_sse4_1() 169 sum0 = _mm_mullo_epi32(vecX0, vecY0); in xcorr_kernel_sse4_1() 170 sum1 = _mm_mullo_epi32(vecX1, vecY1); in xcorr_kernel_sse4_1() 171 sum2 = _mm_mullo_epi32(vecX2, vecY2); in xcorr_kernel_sse4_1() 172 sum3 = _mm_mullo_epi32(vecX3, vecY3); in xcorr_kernel_sse4_1() 187 sum0 = _mm_mullo_epi32(vecX0, vecY0); in xcorr_kernel_sse4_1()
|
/external/libopus/silk/fixed/x86/ |
D | burg_modified_FIX_sse4_1.c | 174 T1_3210 = _mm_mullo_epi32( PTR_3210, X1_3210 ); in silk_burg_modified_sse4_1() 175 T2_3210 = _mm_mullo_epi32( SUBFR_3210, X2_3210 ); in silk_burg_modified_sse4_1() 184 PTR_3210 = _mm_mullo_epi32( ATMP_3210, PTR_3210 ); in silk_burg_modified_sse4_1() 185 SUBFR_3210 = _mm_mullo_epi32( ATMP_3210, SUBFR_3210 ); in silk_burg_modified_sse4_1()
|
/external/clang/test/CodeGen/ |
D | sse41-builtins.c | 324 return _mm_mullo_epi32(x, y); in test_mm_mullo_epi32()
|
/external/libvpx/libvpx/vp9/encoder/x86/ |
D | vp9_diamond_search_sad_avx.c | 234 v_cost_d = _mm_mullo_epi32(v_cost_d, v_spb_d); in vp9_diamond_search_sad_avx()
|
/external/gemmlowp/fixedpoint/ |
D | fixedpoint_sse.h | 106 return _mm_mullo_epi32(a, b);
|
/external/clang/lib/Headers/ |
D | smmintrin.h | 122 _mm_mullo_epi32 (__m128i __V1, __m128i __V2) in _mm_mullo_epi32() function
|
/external/mesa3d/src/gallium/drivers/swr/rasterizer/core/ |
D | rasterizer_impl.h | 896 vAi = _mm_mullo_epi32(vAi, _mm_set1_epi32(-1)); 897 vBi = _mm_mullo_epi32(vBi, _mm_set1_epi32(-1));
|